nerugm-pt-pl10-0 / trainer_state.json
apwic's picture
End of training
3feb98d verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 0.8392817974090576,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.9688,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.0879120879120879,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.26666666666666666,
"eval_PERSON_recall": 0.05263157894736842,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.0,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.0,
"eval_TIME_recall": 0.0,
"eval_loss": 0.5576337575912476,
"eval_overall_accuracy": 0.8432778489116517,
"eval_overall_f1": 0.042666666666666665,
"eval_overall_precision": 0.21621621621621623,
"eval_overall_recall": 0.023668639053254437,
"eval_runtime": 0.3335,
"eval_samples_per_second": 560.647,
"eval_steps_per_second": 8.994,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.1076773405075073,
"learning_rate": 4.9e-05,
"loss": 0.4767,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.288659793814433,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.5,
"eval_LOCATION_recall": 0.2028985507246377,
"eval_ORGANIZATION_f1": 0.07058823529411765,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.1111111111111111,
"eval_ORGANIZATION_recall": 0.05172413793103448,
"eval_PERSON_f1": 0.5936739659367396,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.47104247104247104,
"eval_PERSON_recall": 0.8026315789473685,
"eval_QUANTITY_f1": 0.11111111111111112,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.125,
"eval_QUANTITY_recall": 0.1,
"eval_TIME_f1": 0.523076923076923,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.4722222222222222,
"eval_TIME_recall": 0.5862068965517241,
"eval_loss": 0.31268012523651123,
"eval_overall_accuracy": 0.8991037131882202,
"eval_overall_f1": 0.44662921348314605,
"eval_overall_precision": 0.42513368983957217,
"eval_overall_recall": 0.47041420118343197,
"eval_runtime": 0.3348,
"eval_samples_per_second": 558.483,
"eval_steps_per_second": 8.96,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 1.2600445747375488,
"learning_rate": 4.85e-05,
"loss": 0.2969,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.6303030303030303,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.5416666666666666,
"eval_LOCATION_recall": 0.7536231884057971,
"eval_ORGANIZATION_f1": 0.4605263157894736,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.3723404255319149,
"eval_ORGANIZATION_recall": 0.603448275862069,
"eval_PERSON_f1": 0.8085106382978723,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.751412429378531,
"eval_PERSON_recall": 0.875,
"eval_QUANTITY_f1": 0.7027027027027029,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.5909090909090909,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.7301587301587301,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6764705882352942,
"eval_TIME_recall": 0.7931034482758621,
"eval_loss": 0.22261539101600647,
"eval_overall_accuracy": 0.9275288092189501,
"eval_overall_f1": 0.6871008939974458,
"eval_overall_precision": 0.604494382022472,
"eval_overall_recall": 0.7958579881656804,
"eval_runtime": 0.333,
"eval_samples_per_second": 561.501,
"eval_steps_per_second": 9.008,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 1.1735649108886719,
"learning_rate": 4.8e-05,
"loss": 0.2125,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.7346938775510203,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6923076923076923,
"eval_LOCATION_recall": 0.782608695652174,
"eval_ORGANIZATION_f1": 0.5354330708661417,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.4927536231884058,
"eval_ORGANIZATION_recall": 0.5862068965517241,
"eval_PERSON_f1": 0.8288288288288289,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.7624309392265194,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.6944444444444444,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.5952380952380952,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7076923076923076,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6388888888888888,
"eval_TIME_recall": 0.7931034482758621,
"eval_loss": 0.17351830005645752,
"eval_overall_accuracy": 0.9400768245838669,
"eval_overall_f1": 0.7365591397849461,
"eval_overall_precision": 0.6748768472906403,
"eval_overall_recall": 0.8106508875739645,
"eval_runtime": 0.3365,
"eval_samples_per_second": 555.787,
"eval_steps_per_second": 8.916,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 1.4631017446517944,
"learning_rate": 4.75e-05,
"loss": 0.1759,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.6762589928057554,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.6714285714285714,
"eval_LOCATION_recall": 0.6811594202898551,
"eval_ORGANIZATION_f1": 0.6056338028169014,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.5119047619047619,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8466257668711656,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.7931034482758621,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.7164179104477612,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.8275862068965517,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.14357861876487732,
"eval_overall_accuracy": 0.9475032010243278,
"eval_overall_f1": 0.7540983606557377,
"eval_overall_precision": 0.700507614213198,
"eval_overall_recall": 0.8165680473372781,
"eval_runtime": 0.3351,
"eval_samples_per_second": 558.08,
"eval_steps_per_second": 8.953,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 0.8950690627098083,
"learning_rate": 4.7e-05,
"loss": 0.1548,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8840579710144928,
"eval_ORGANIZATION_f1": 0.6811594202898551,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.5875,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.8518518518518517,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8023255813953488,
"eval_PERSON_recall": 0.9078947368421053,
"eval_QUANTITY_f1": 0.7142857142857143,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.625,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.14464175701141357,
"eval_overall_accuracy": 0.952112676056338,
"eval_overall_f1": 0.7866666666666666,
"eval_overall_precision": 0.7160194174757282,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.3323,
"eval_samples_per_second": 562.696,
"eval_steps_per_second": 9.027,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 0.48694196343421936,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.1452,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.8289473684210527,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6870229007633589,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6164383561643836,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.875,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8333333333333334,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.6153846153846154,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.5,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7741935483870968,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.14724624156951904,
"eval_overall_accuracy": 0.9510883482714468,
"eval_overall_f1": 0.7967698519515478,
"eval_overall_precision": 0.7308641975308642,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.3323,
"eval_samples_per_second": 562.777,
"eval_steps_per_second": 9.029,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.39879658818244934,
"learning_rate": 4.600000000000001e-05,
"loss": 0.1368,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.8378378378378378,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7848101265822784,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7142857142857144,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6097560975609756,
"eval_ORGANIZATION_recall": 0.8620689655172413,
"eval_PERSON_f1": 0.8722741433021807,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8284023668639053,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.746268656716418,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.6376811594202898,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.55,
"eval_TIME_recall": 0.7586206896551724,
"eval_loss": 0.1397438496351242,
"eval_overall_accuracy": 0.9539052496798975,
"eval_overall_f1": 0.8026845637583893,
"eval_overall_precision": 0.7346437346437347,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.3334,
"eval_samples_per_second": 560.876,
"eval_steps_per_second": 8.998,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 1.2802802324295044,
"learning_rate": 4.55e-05,
"loss": 0.1278,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.8258064516129032,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7441860465116279,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.5950413223140496,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.5714285714285714,
"eval_ORGANIZATION_recall": 0.6206896551724138,
"eval_PERSON_f1": 0.8623853211009175,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8057142857142857,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7352941176470588,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6578947368421053,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.6571428571428573,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.5609756097560976,
"eval_TIME_recall": 0.7931034482758621,
"eval_loss": 0.14592860639095306,
"eval_overall_accuracy": 0.9528809218950064,
"eval_overall_f1": 0.7800269905533064,
"eval_overall_precision": 0.71712158808933,
"eval_overall_recall": 0.8550295857988166,
"eval_runtime": 0.3343,
"eval_samples_per_second": 559.31,
"eval_steps_per_second": 8.973,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 1.4159973859786987,
"learning_rate": 4.5e-05,
"loss": 0.1202,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.7999999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7209302325581395,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.6614173228346457,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6086956521739131,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.877742946708464,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8383233532934131,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.6944444444444444,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.5952380952380952,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8064516129032258,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.13962122797966003,
"eval_overall_accuracy": 0.9559539052496799,
"eval_overall_f1": 0.8,
"eval_overall_precision": 0.7405541561712846,
"eval_overall_recall": 0.8698224852071006,
"eval_runtime": 0.3332,
"eval_samples_per_second": 561.16,
"eval_steps_per_second": 9.003,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 1.0556025505065918,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.1166,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.8552631578947367,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7831325301204819,
"eval_LOCATION_recall": 0.9420289855072463,
"eval_ORGANIZATION_f1": 0.6515151515151516,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.581081081081081,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.88125,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8392857142857143,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.6944444444444444,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.5952380952380952,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.13871203362941742,
"eval_overall_accuracy": 0.9556978233034571,
"eval_overall_f1": 0.8054054054054053,
"eval_overall_precision": 0.7412935323383084,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3363,
"eval_samples_per_second": 556.023,
"eval_steps_per_second": 8.92,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 1.1935970783233643,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1108,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.5641025641025641,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.559322033898305,
"eval_ORGANIZATION_recall": 0.5689655172413793,
"eval_PERSON_f1": 0.888888888888889,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7352941176470588,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6578947368421053,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.13067495822906494,
"eval_overall_accuracy": 0.9580025608194622,
"eval_overall_f1": 0.8062234794908061,
"eval_overall_precision": 0.7723577235772358,
"eval_overall_recall": 0.8431952662721893,
"eval_runtime": 0.3341,
"eval_samples_per_second": 559.688,
"eval_steps_per_second": 8.979,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 0.38182273507118225,
"learning_rate": 4.35e-05,
"loss": 0.1052,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.8476821192052981,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7804878048780488,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.71875,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6571428571428571,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.8952380952380953,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8650306748466258,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.13124220073223114,
"eval_overall_accuracy": 0.9613316261203585,
"eval_overall_f1": 0.8282548476454293,
"eval_overall_precision": 0.7786458333333334,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.3361,
"eval_samples_per_second": 556.458,
"eval_steps_per_second": 8.927,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 1.8100732564926147,
"learning_rate": 4.3e-05,
"loss": 0.104,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.863013698630137,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6991869918699186,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6615384615384615,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9085173501577286,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8727272727272727,
"eval_PERSON_recall": 0.9473684210526315,
"eval_QUANTITY_f1": 0.6956521739130435,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6153846153846154,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7419354838709677,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.696969696969697,
"eval_TIME_recall": 0.7931034482758621,
"eval_loss": 0.13739244639873505,
"eval_overall_accuracy": 0.9608194622279129,
"eval_overall_f1": 0.8284518828451882,
"eval_overall_precision": 0.783641160949868,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.3335,
"eval_samples_per_second": 560.761,
"eval_steps_per_second": 8.996,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 1.0627801418304443,
"learning_rate": 4.25e-05,
"loss": 0.0963,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.8366013071895425,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7619047619047619,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6610169491525424,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.6724137931034483,
"eval_PERSON_f1": 0.9102564102564101,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8875,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.6233766233766233,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.5106382978723404,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7741935483870968,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.13979628682136536,
"eval_overall_accuracy": 0.9572343149807938,
"eval_overall_f1": 0.8116343490304708,
"eval_overall_precision": 0.7630208333333334,
"eval_overall_recall": 0.8668639053254438,
"eval_runtime": 0.3344,
"eval_samples_per_second": 559.247,
"eval_steps_per_second": 8.972,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 0.8222811222076416,
"learning_rate": 4.2e-05,
"loss": 0.0952,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.8311688311688311,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7529411764705882,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7343749999999999,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6714285714285714,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.9067524115755626,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8867924528301887,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.676056338028169,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.5853658536585366,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.14147908985614777,
"eval_overall_accuracy": 0.9580025608194622,
"eval_overall_f1": 0.8287292817679558,
"eval_overall_precision": 0.7772020725388601,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3348,
"eval_samples_per_second": 558.612,
"eval_steps_per_second": 8.962,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.7422318458557129,
"learning_rate": 4.15e-05,
"loss": 0.0902,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.8533333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7901234567901234,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7000000000000001,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.5975609756097561,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.89171974522293,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.6315789473684211,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.5217391304347826,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7540983606557378,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.71875,
"eval_TIME_recall": 0.7931034482758621,
"eval_loss": 0.14226044714450836,
"eval_overall_accuracy": 0.9580025608194622,
"eval_overall_f1": 0.8097165991902834,
"eval_overall_precision": 0.7444168734491315,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3343,
"eval_samples_per_second": 559.424,
"eval_steps_per_second": 8.975,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.5720771551132202,
"learning_rate": 4.1e-05,
"loss": 0.0919,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6976744186046512,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6338028169014085,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9113924050632912,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8780487804878049,
"eval_PERSON_recall": 0.9473684210526315,
"eval_QUANTITY_f1": 0.676056338028169,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.5853658536585366,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7301587301587301,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6764705882352942,
"eval_TIME_recall": 0.7931034482758621,
"eval_loss": 0.14349369704723358,
"eval_overall_accuracy": 0.9623559539052496,
"eval_overall_f1": 0.8275862068965517,
"eval_overall_precision": 0.7751937984496124,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3339,
"eval_samples_per_second": 560.088,
"eval_steps_per_second": 8.985,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 1.00640070438385,
"learning_rate": 4.05e-05,
"loss": 0.0864,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6885245901639345,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.65625,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.9050632911392406,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8719512195121951,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.64,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.5333333333333333,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7796610169491527,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.7931034482758621,
"eval_loss": 0.14329810440540314,
"eval_overall_accuracy": 0.9582586427656851,
"eval_overall_f1": 0.8205841446453407,
"eval_overall_precision": 0.7742782152230971,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.338,
"eval_samples_per_second": 553.255,
"eval_steps_per_second": 8.876,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 0.7463036179542542,
"learning_rate": 4e-05,
"loss": 0.0853,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.8749999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.84,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7230769230769231,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6527777777777778,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.9137380191693291,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8881987577639752,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.7575757575757577,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7540983606557378,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.71875,
"eval_TIME_recall": 0.7931034482758621,
"eval_loss": 0.13515153527259827,
"eval_overall_accuracy": 0.963124199743918,
"eval_overall_f1": 0.8431372549019608,
"eval_overall_precision": 0.800531914893617,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.3312,
"eval_samples_per_second": 564.613,
"eval_steps_per_second": 9.058,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 0.4474703073501587,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0782,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.8322147651006713,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.775,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.696969696969697,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6216216216216216,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.9050632911392406,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8719512195121951,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.746268656716418,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.1520513892173767,
"eval_overall_accuracy": 0.9574903969270167,
"eval_overall_f1": 0.8241758241758241,
"eval_overall_precision": 0.7692307692307693,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3358,
"eval_samples_per_second": 556.946,
"eval_steps_per_second": 8.935,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.46933385729789734,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.0778,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.8533333333333333,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7901234567901234,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7259259259259259,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.8952380952380953,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8650306748466258,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7272727272727272,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7868852459016394,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.14189890027046204,
"eval_overall_accuracy": 0.9618437900128041,
"eval_overall_f1": 0.8308115543328748,
"eval_overall_precision": 0.7763496143958869,
"eval_overall_recall": 0.893491124260355,
"eval_runtime": 0.3349,
"eval_samples_per_second": 558.354,
"eval_steps_per_second": 8.958,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 0.5191448330879211,
"learning_rate": 3.85e-05,
"loss": 0.0751,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.8513513513513514,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6976744186046512,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6338028169014085,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9015873015873016,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8711656441717791,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.1431107521057129,
"eval_overall_accuracy": 0.9600512163892445,
"eval_overall_f1": 0.8243430152143846,
"eval_overall_precision": 0.7740259740259741,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3347,
"eval_samples_per_second": 558.691,
"eval_steps_per_second": 8.963,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 1.5136590003967285,
"learning_rate": 3.8e-05,
"loss": 0.0761,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6935483870967741,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6515151515151515,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9079365079365079,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8773006134969326,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.7500000000000001,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7058823529411765,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.1410786360502243,
"eval_overall_accuracy": 0.9633802816901409,
"eval_overall_f1": 0.8394366197183097,
"eval_overall_precision": 0.8010752688172043,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3473,
"eval_samples_per_second": 538.469,
"eval_steps_per_second": 8.639,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 0.8224151134490967,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0718,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6923076923076923,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9079365079365079,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8773006134969326,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.64,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.5333333333333333,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7301587301587301,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6764705882352942,
"eval_TIME_recall": 0.7931034482758621,
"eval_loss": 0.15752357244491577,
"eval_overall_accuracy": 0.9577464788732394,
"eval_overall_f1": 0.8164383561643835,
"eval_overall_precision": 0.7602040816326531,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3326,
"eval_samples_per_second": 562.261,
"eval_steps_per_second": 9.02,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 1.1950877904891968,
"learning_rate": 3.7e-05,
"loss": 0.0706,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.8551724137931034,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7213114754098361,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6875,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.9166666666666667,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.89375,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7868852459016394,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.14247971773147583,
"eval_overall_accuracy": 0.9623559539052496,
"eval_overall_f1": 0.8389830508474576,
"eval_overall_precision": 0.8027027027027027,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.3335,
"eval_samples_per_second": 560.748,
"eval_steps_per_second": 8.996,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 0.48883256316185,
"learning_rate": 3.65e-05,
"loss": 0.0675,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7101449275362319,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6125,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.890282131661442,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8502994011976048,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.6857142857142857,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.16071684658527374,
"eval_overall_accuracy": 0.9559539052496799,
"eval_overall_f1": 0.819538670284939,
"eval_overall_precision": 0.7568922305764411,
"eval_overall_recall": 0.893491124260355,
"eval_runtime": 0.3357,
"eval_samples_per_second": 557.057,
"eval_steps_per_second": 8.937,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 5.45798397064209,
"learning_rate": 3.6e-05,
"loss": 0.0692,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.688,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6417910447761194,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8832807570977917,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8484848484848485,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.7301587301587301,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6764705882352942,
"eval_TIME_recall": 0.7931034482758621,
"eval_loss": 0.14975115656852722,
"eval_overall_accuracy": 0.9592829705505762,
"eval_overall_f1": 0.8205841446453407,
"eval_overall_precision": 0.7742782152230971,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.3351,
"eval_samples_per_second": 558.088,
"eval_steps_per_second": 8.953,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 0.3084903359413147,
"learning_rate": 3.55e-05,
"loss": 0.0663,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.84,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7777777777777778,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7000000000000001,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.5975609756097561,
"eval_ORGANIZATION_recall": 0.8448275862068966,
"eval_PERSON_f1": 0.8924050632911392,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8597560975609756,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7272727272727272,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7741935483870968,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.148148775100708,
"eval_overall_accuracy": 0.9592829705505762,
"eval_overall_f1": 0.8201634877384196,
"eval_overall_precision": 0.76010101010101,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.3329,
"eval_samples_per_second": 561.66,
"eval_steps_per_second": 9.011,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 1.554962396621704,
"learning_rate": 3.5e-05,
"loss": 0.0642,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6612903225806452,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6212121212121212,
"eval_ORGANIZATION_recall": 0.7068965517241379,
"eval_PERSON_f1": 0.889589905362776,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8545454545454545,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8253968253968254,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7878787878787878,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.14457598328590393,
"eval_overall_accuracy": 0.963124199743918,
"eval_overall_f1": 0.8338028169014083,
"eval_overall_precision": 0.7956989247311828,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.3355,
"eval_samples_per_second": 557.403,
"eval_steps_per_second": 8.942,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.40657302737236023,
"learning_rate": 3.45e-05,
"loss": 0.0602,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.65625,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.8924050632911392,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8597560975609756,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7272727272727272,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.1596260815858841,
"eval_overall_accuracy": 0.9590268886043534,
"eval_overall_f1": 0.8189415041782729,
"eval_overall_precision": 0.7736842105263158,
"eval_overall_recall": 0.8698224852071006,
"eval_runtime": 0.3328,
"eval_samples_per_second": 561.9,
"eval_steps_per_second": 9.014,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.3220694363117218,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0618,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.8456375838926175,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7258064516129032,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6818181818181818,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.8980891719745223,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8703703703703703,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.676056338028169,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.5853658536585366,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7540983606557378,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.71875,
"eval_TIME_recall": 0.7931034482758621,
"eval_loss": 0.15103064477443695,
"eval_overall_accuracy": 0.9605633802816902,
"eval_overall_f1": 0.82336578581363,
"eval_overall_precision": 0.7769028871391076,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.336,
"eval_samples_per_second": 556.607,
"eval_steps_per_second": 8.93,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 1.0746521949768066,
"learning_rate": 3.35e-05,
"loss": 0.0587,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.882758620689655,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8421052631578947,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6976744186046512,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6338028169014085,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.9050632911392406,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8719512195121951,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.78125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7741935483870968,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.15125295519828796,
"eval_overall_accuracy": 0.9636363636363636,
"eval_overall_f1": 0.840782122905028,
"eval_overall_precision": 0.7962962962962963,
"eval_overall_recall": 0.8905325443786982,
"eval_runtime": 0.3377,
"eval_samples_per_second": 553.74,
"eval_steps_per_second": 8.884,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 1.5852210521697998,
"learning_rate": 3.3e-05,
"loss": 0.0575,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.8435374149659864,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7948717948717948,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.7175572519083969,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6438356164383562,
"eval_ORGANIZATION_recall": 0.8103448275862069,
"eval_PERSON_f1": 0.8924050632911392,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8597560975609756,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.6857142857142857,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.696969696969697,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6216216216216216,
"eval_TIME_recall": 0.7931034482758621,
"eval_loss": 0.17214131355285645,
"eval_overall_accuracy": 0.9574903969270167,
"eval_overall_f1": 0.8136986301369863,
"eval_overall_precision": 0.7576530612244898,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.332,
"eval_samples_per_second": 563.205,
"eval_steps_per_second": 9.035,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 0.709221601486206,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0568,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.736,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6865671641791045,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.889589905362776,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8545454545454545,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.6956521739130435,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6153846153846154,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7666666666666667,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7419354838709677,
"eval_TIME_recall": 0.7931034482758621,
"eval_loss": 0.16309089958667755,
"eval_overall_accuracy": 0.9605633802816902,
"eval_overall_f1": 0.8312412831241283,
"eval_overall_precision": 0.7862796833773087,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3342,
"eval_samples_per_second": 559.545,
"eval_steps_per_second": 8.977,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 0.5662766098976135,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.058,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.8671328671328672,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8378378378378378,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.711111111111111,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6233766233766234,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9079365079365079,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8773006134969326,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.78125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7868852459016394,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.15275219082832336,
"eval_overall_accuracy": 0.9618437900128041,
"eval_overall_f1": 0.8412256267409471,
"eval_overall_precision": 0.7947368421052632,
"eval_overall_recall": 0.893491124260355,
"eval_runtime": 0.3343,
"eval_samples_per_second": 559.388,
"eval_steps_per_second": 8.974,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 0.11498302221298218,
"learning_rate": 3.15e-05,
"loss": 0.0542,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6875,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6285714285714286,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.9015873015873016,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8711656441717791,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.1606374979019165,
"eval_overall_accuracy": 0.9597951344430218,
"eval_overall_f1": 0.8272980501392758,
"eval_overall_precision": 0.781578947368421,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.334,
"eval_samples_per_second": 559.858,
"eval_steps_per_second": 8.982,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 0.5296043157577515,
"learning_rate": 3.1e-05,
"loss": 0.0543,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.8456375838926175,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7875,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7058823529411765,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6153846153846154,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9038461538461539,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.88125,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.5714285714285714,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7741935483870968,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.16339102387428284,
"eval_overall_accuracy": 0.9582586427656851,
"eval_overall_f1": 0.8207934336525308,
"eval_overall_precision": 0.7633587786259542,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3345,
"eval_samples_per_second": 559.005,
"eval_steps_per_second": 8.968,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 0.7791297435760498,
"learning_rate": 3.05e-05,
"loss": 0.0545,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.882758620689655,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8421052631578947,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6929133858267716,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6376811594202898,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.8853503184713376,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.78125,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7352941176470589,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.15971286594867706,
"eval_overall_accuracy": 0.9590268886043534,
"eval_overall_f1": 0.8302945301542777,
"eval_overall_precision": 0.7893333333333333,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.3358,
"eval_samples_per_second": 556.857,
"eval_steps_per_second": 8.934,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 1.3748724460601807,
"learning_rate": 3e-05,
"loss": 0.0522,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.8571428571428572,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8076923076923077,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7166666666666668,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6935483870967742,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8059701492537312,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.15032222867012024,
"eval_overall_accuracy": 0.9626120358514725,
"eval_overall_f1": 0.8366197183098592,
"eval_overall_precision": 0.7983870967741935,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.3322,
"eval_samples_per_second": 562.995,
"eval_steps_per_second": 9.032,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.5511608719825745,
"learning_rate": 2.95e-05,
"loss": 0.0484,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.863013698630137,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6984126984126984,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.888888888888889,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7575757575757577,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7540983606557378,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.71875,
"eval_TIME_recall": 0.7931034482758621,
"eval_loss": 0.16514161229133606,
"eval_overall_accuracy": 0.9592829705505762,
"eval_overall_f1": 0.8263305322128851,
"eval_overall_precision": 0.7845744680851063,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.3352,
"eval_samples_per_second": 557.858,
"eval_steps_per_second": 8.95,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.6805091500282288,
"learning_rate": 2.9e-05,
"loss": 0.0472,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.8671328671328672,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8378378378378378,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.6984126984126984,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.9096774193548387,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8924050632911392,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7272727272727272,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.16605274379253387,
"eval_overall_accuracy": 0.9600512163892445,
"eval_overall_f1": 0.8321579689703809,
"eval_overall_precision": 0.7951482479784366,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.3329,
"eval_samples_per_second": 561.686,
"eval_steps_per_second": 9.011,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 3.199406147003174,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0498,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.8749999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.84,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7040000000000001,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6567164179104478,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.9067524115755626,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8867924528301887,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8059701492537312,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.155135378241539,
"eval_overall_accuracy": 0.9628681177976952,
"eval_overall_f1": 0.8422535211267606,
"eval_overall_precision": 0.803763440860215,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.3322,
"eval_samples_per_second": 562.861,
"eval_steps_per_second": 9.03,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 1.2136147022247314,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.0474,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.8749999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.84,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7154471544715447,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.676923076923077,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.8867924528301887,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7741935483870968,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.1694120317697525,
"eval_overall_accuracy": 0.9600512163892445,
"eval_overall_f1": 0.8314606741573034,
"eval_overall_precision": 0.7914438502673797,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.3337,
"eval_samples_per_second": 560.411,
"eval_steps_per_second": 8.991,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 1.1127651929855347,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0483,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8551724137931034,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8157894736842105,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.6929133858267716,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6376811594202898,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.888888888888889,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.6388888888888888,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.5476190476190477,
"eval_QUANTITY_recall": 0.7666666666666667,
"eval_TIME_f1": 0.7868852459016394,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.17468813061714172,
"eval_overall_accuracy": 0.954673495518566,
"eval_overall_f1": 0.8138888888888889,
"eval_overall_precision": 0.7670157068062827,
"eval_overall_recall": 0.8668639053254438,
"eval_runtime": 0.3348,
"eval_samples_per_second": 558.469,
"eval_steps_per_second": 8.959,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.21913494169712067,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.045,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.8513513513513514,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.7974683544303798,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6942148760330579,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.89171974522293,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7352941176470588,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6578947368421053,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7272727272727273,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6486486486486487,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.1735159456729889,
"eval_overall_accuracy": 0.9577464788732394,
"eval_overall_f1": 0.8200836820083682,
"eval_overall_precision": 0.7757255936675461,
"eval_overall_recall": 0.8698224852071006,
"eval_runtime": 0.3358,
"eval_samples_per_second": 556.961,
"eval_steps_per_second": 8.935,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 0.8087287545204163,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.0431,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6829268292682927,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6461538461538462,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.8860759493670887,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7164179104477612,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.17915095388889313,
"eval_overall_accuracy": 0.9585147247119078,
"eval_overall_f1": 0.8207282913165266,
"eval_overall_precision": 0.7792553191489362,
"eval_overall_recall": 0.8668639053254438,
"eval_runtime": 0.3356,
"eval_samples_per_second": 557.259,
"eval_steps_per_second": 8.94,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 1.3942605257034302,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0424,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.8648648648648648,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.810126582278481,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7419354838709677,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.696969696969697,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.8924050632911392,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8597560975609756,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7868852459016394,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.1734819859266281,
"eval_overall_accuracy": 0.9605633802816902,
"eval_overall_f1": 0.8340306834030683,
"eval_overall_precision": 0.7889182058047494,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.335,
"eval_samples_per_second": 558.27,
"eval_steps_per_second": 8.956,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.8996381759643555,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0426,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.863013698630137,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7441860465116279,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.676056338028169,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.8867924528301887,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8181818181818182,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.75,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.17559018731117249,
"eval_overall_accuracy": 0.9597951344430218,
"eval_overall_f1": 0.8381742738589212,
"eval_overall_precision": 0.787012987012987,
"eval_overall_recall": 0.8964497041420119,
"eval_runtime": 0.3329,
"eval_samples_per_second": 561.775,
"eval_steps_per_second": 9.012,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 0.22222945094108582,
"learning_rate": 2.5e-05,
"loss": 0.0412,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6548672566371682,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6727272727272727,
"eval_ORGANIZATION_recall": 0.6379310344827587,
"eval_PERSON_f1": 0.8832807570977917,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8484848484848485,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.16795222461223602,
"eval_overall_accuracy": 0.9597951344430218,
"eval_overall_f1": 0.8295454545454545,
"eval_overall_precision": 0.7978142076502732,
"eval_overall_recall": 0.863905325443787,
"eval_runtime": 0.3341,
"eval_samples_per_second": 559.727,
"eval_steps_per_second": 8.98,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.7834493517875671,
"learning_rate": 2.45e-05,
"loss": 0.0407,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.870748299319728,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8205128205128205,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6557377049180328,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.6896551724137931,
"eval_PERSON_f1": 0.9015873015873016,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8711656441717791,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.746268656716418,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7868852459016394,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.17565281689167023,
"eval_overall_accuracy": 0.9595390524967989,
"eval_overall_f1": 0.8286516853932584,
"eval_overall_precision": 0.7887700534759359,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.3349,
"eval_samples_per_second": 558.379,
"eval_steps_per_second": 8.958,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.5259361863136292,
"learning_rate": 2.4e-05,
"loss": 0.0421,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.863013698630137,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7142857142857142,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6617647058823529,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.888888888888889,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.18448342382907867,
"eval_overall_accuracy": 0.9587708066581306,
"eval_overall_f1": 0.83008356545961,
"eval_overall_precision": 0.7842105263157895,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3359,
"eval_samples_per_second": 556.686,
"eval_steps_per_second": 8.931,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 1.3698176145553589,
"learning_rate": 2.35e-05,
"loss": 0.0415,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.882758620689655,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8421052631578947,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7142857142857142,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6617647058823529,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.888888888888889,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.7741935483870968,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.180740624666214,
"eval_overall_accuracy": 0.9603072983354674,
"eval_overall_f1": 0.8379888268156425,
"eval_overall_precision": 0.7936507936507936,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3346,
"eval_samples_per_second": 558.915,
"eval_steps_per_second": 8.967,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 0.6899826526641846,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0378,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6615384615384615,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.5972222222222222,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.888888888888889,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8059701492537312,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.1903461366891861,
"eval_overall_accuracy": 0.9587708066581306,
"eval_overall_f1": 0.8250000000000001,
"eval_overall_precision": 0.7774869109947644,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.3444,
"eval_samples_per_second": 542.946,
"eval_steps_per_second": 8.71,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 1.0006171464920044,
"learning_rate": 2.25e-05,
"loss": 0.0388,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7166666666666668,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6935483870967742,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8980891719745223,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8703703703703703,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7164179104477612,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.18361018598079681,
"eval_overall_accuracy": 0.9592829705505762,
"eval_overall_f1": 0.8326300984528833,
"eval_overall_precision": 0.7935656836461126,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.3373,
"eval_samples_per_second": 554.414,
"eval_steps_per_second": 8.894,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 0.8649386167526245,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0381,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.688,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6417910447761194,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.89171974522293,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7647058823529413,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8666666666666667,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.17993959784507751,
"eval_overall_accuracy": 0.9595390524967989,
"eval_overall_f1": 0.8382559774964837,
"eval_overall_precision": 0.7989276139410187,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3352,
"eval_samples_per_second": 557.898,
"eval_steps_per_second": 8.95,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.5134249925613403,
"learning_rate": 2.15e-05,
"loss": 0.0377,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6451612903225807,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6060606060606061,
"eval_ORGANIZATION_recall": 0.6896551724137931,
"eval_PERSON_f1": 0.8797468354430381,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8475609756097561,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.7941176470588235,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7105263157894737,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.7692307692307692,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6944444444444444,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.1980062872171402,
"eval_overall_accuracy": 0.9554417413572344,
"eval_overall_f1": 0.8189415041782729,
"eval_overall_precision": 0.7736842105263158,
"eval_overall_recall": 0.8698224852071006,
"eval_runtime": 0.3364,
"eval_samples_per_second": 555.829,
"eval_steps_per_second": 8.917,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 1.7326457500457764,
"learning_rate": 2.1e-05,
"loss": 0.0382,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.8671328671328672,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8378378378378378,
"eval_LOCATION_recall": 0.8985507246376812,
"eval_ORGANIZATION_f1": 0.688,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6417910447761194,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8980891719745223,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8703703703703703,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7352941176470588,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6578947368421053,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.1960817277431488,
"eval_overall_accuracy": 0.9562099871959027,
"eval_overall_f1": 0.8274894810659188,
"eval_overall_precision": 0.7866666666666666,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.3347,
"eval_samples_per_second": 558.716,
"eval_steps_per_second": 8.963,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 0.785622239112854,
"learning_rate": 2.05e-05,
"loss": 0.0358,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6984126984126984,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.8952380952380953,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8650306748466258,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7536231884057971,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.1875164657831192,
"eval_overall_accuracy": 0.9600512163892445,
"eval_overall_f1": 0.835195530726257,
"eval_overall_precision": 0.791005291005291,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.3334,
"eval_samples_per_second": 560.851,
"eval_steps_per_second": 8.998,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 0.8723583221435547,
"learning_rate": 2e-05,
"loss": 0.0355,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.703125,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6428571428571429,
"eval_ORGANIZATION_recall": 0.7758620689655172,
"eval_PERSON_f1": 0.8938906752411576,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8742138364779874,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.7164179104477612,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6486486486486487,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.8196721311475409,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.19338777661323547,
"eval_overall_accuracy": 0.9577464788732394,
"eval_overall_f1": 0.8314606741573034,
"eval_overall_precision": 0.7914438502673797,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.3431,
"eval_samples_per_second": 544.973,
"eval_steps_per_second": 8.743,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 1.1464908123016357,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.037,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.8749999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.84,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6929133858267716,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6376811594202898,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7647058823529413,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.18568746745586395,
"eval_overall_accuracy": 0.9592829705505762,
"eval_overall_f1": 0.829608938547486,
"eval_overall_precision": 0.7857142857142857,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.3342,
"eval_samples_per_second": 559.582,
"eval_steps_per_second": 8.977,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.577111542224884,
"learning_rate": 1.9e-05,
"loss": 0.0342,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.671875,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6142857142857143,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8853503184713376,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.7272727272727272,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.19420312345027924,
"eval_overall_accuracy": 0.9564660691421255,
"eval_overall_f1": 0.8184357541899442,
"eval_overall_precision": 0.7751322751322751,
"eval_overall_recall": 0.8668639053254438,
"eval_runtime": 0.3361,
"eval_samples_per_second": 556.377,
"eval_steps_per_second": 8.926,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 0.4379956126213074,
"learning_rate": 1.85e-05,
"loss": 0.0349,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.888888888888889,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6942148760330579,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.8924050632911392,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8597560975609756,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.8059701492537312,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.18639543652534485,
"eval_overall_accuracy": 0.9603072983354674,
"eval_overall_f1": 0.8450704225352114,
"eval_overall_precision": 0.8064516129032258,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.339,
"eval_samples_per_second": 551.625,
"eval_steps_per_second": 8.85,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 1.331531286239624,
"learning_rate": 1.8e-05,
"loss": 0.0316,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6814814814814815,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.5974025974025974,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.8825396825396825,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.852760736196319,
"eval_PERSON_recall": 0.9144736842105263,
"eval_QUANTITY_f1": 0.7647058823529413,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6842105263157895,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.19557389616966248,
"eval_overall_accuracy": 0.9554417413572344,
"eval_overall_f1": 0.8209366391184573,
"eval_overall_precision": 0.7680412371134021,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3402,
"eval_samples_per_second": 549.599,
"eval_steps_per_second": 8.817,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.3099250793457031,
"learning_rate": 1.75e-05,
"loss": 0.0358,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.882758620689655,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8421052631578947,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6808510638297872,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.5783132530120482,
"eval_ORGANIZATION_recall": 0.8275862068965517,
"eval_PERSON_f1": 0.9015873015873016,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8711656441717791,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.7575757575757577,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.19938279688358307,
"eval_overall_accuracy": 0.9567221510883482,
"eval_overall_f1": 0.8290013679890562,
"eval_overall_precision": 0.7709923664122137,
"eval_overall_recall": 0.8964497041420119,
"eval_runtime": 0.3388,
"eval_samples_per_second": 551.909,
"eval_steps_per_second": 8.854,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.5862748026847839,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0317,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.882758620689655,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8421052631578947,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6559999999999999,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6119402985074627,
"eval_ORGANIZATION_recall": 0.7068965517241379,
"eval_PERSON_f1": 0.8952380952380953,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8650306748466258,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7058823529411765,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.631578947368421,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.21487130224704742,
"eval_overall_accuracy": 0.9556978233034571,
"eval_overall_f1": 0.8200836820083682,
"eval_overall_precision": 0.7757255936675461,
"eval_overall_recall": 0.8698224852071006,
"eval_runtime": 0.3359,
"eval_samples_per_second": 556.74,
"eval_steps_per_second": 8.932,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.5351269841194153,
"learning_rate": 1.65e-05,
"loss": 0.0335,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.863013698630137,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7040000000000001,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6567164179104478,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.9079365079365079,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8773006134969326,
"eval_PERSON_recall": 0.9407894736842105,
"eval_QUANTITY_f1": 0.7272727272727272,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.8253968253968255,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.1979534924030304,
"eval_overall_accuracy": 0.9603072983354674,
"eval_overall_f1": 0.8391608391608392,
"eval_overall_precision": 0.7957559681697612,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3372,
"eval_samples_per_second": 554.49,
"eval_steps_per_second": 8.896,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.3918878138065338,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0333,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.863013698630137,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.688,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6417910447761194,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.889589905362776,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8545454545454545,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.746268656716418,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7384615384615385,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.1945626586675644,
"eval_overall_accuracy": 0.9580025608194622,
"eval_overall_f1": 0.8222222222222222,
"eval_overall_precision": 0.774869109947644,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.3368,
"eval_samples_per_second": 555.197,
"eval_steps_per_second": 8.907,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 0.9337367415428162,
"learning_rate": 1.55e-05,
"loss": 0.0311,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6991869918699186,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6615384615384615,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7878787878787877,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.896551724137931,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.19715982675552368,
"eval_overall_accuracy": 0.9605633802816902,
"eval_overall_f1": 0.8470254957507082,
"eval_overall_precision": 0.8125,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.3336,
"eval_samples_per_second": 560.63,
"eval_steps_per_second": 8.994,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 1.763173222541809,
"learning_rate": 1.5e-05,
"loss": 0.0314,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7049180327868853,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.671875,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8980891719745223,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8703703703703703,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.2073572725057602,
"eval_overall_accuracy": 0.9572343149807938,
"eval_overall_f1": 0.8342696629213484,
"eval_overall_precision": 0.7941176470588235,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.3343,
"eval_samples_per_second": 559.3,
"eval_steps_per_second": 8.973,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 0.9943879842758179,
"learning_rate": 1.45e-05,
"loss": 0.0317,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.863013698630137,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.7301587301587301,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6764705882352942,
"eval_ORGANIZATION_recall": 0.7931034482758621,
"eval_PERSON_f1": 0.9044585987261147,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8765432098765432,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.746268656716418,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7272727272727273,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6486486486486487,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.21239928901195526,
"eval_overall_accuracy": 0.9577464788732394,
"eval_overall_f1": 0.8344923504867873,
"eval_overall_precision": 0.7874015748031497,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3359,
"eval_samples_per_second": 556.631,
"eval_steps_per_second": 8.93,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.39654669165611267,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.0297,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.881118881118881,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8513513513513513,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6379310344827587,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6379310344827587,
"eval_ORGANIZATION_recall": 0.6379310344827587,
"eval_PERSON_f1": 0.9009584664536742,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8757763975155279,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7272727272727272,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.2062947303056717,
"eval_overall_accuracy": 0.9567221510883482,
"eval_overall_f1": 0.8233618233618234,
"eval_overall_precision": 0.7939560439560439,
"eval_overall_recall": 0.8550295857988166,
"eval_runtime": 0.3343,
"eval_samples_per_second": 559.346,
"eval_steps_per_second": 8.973,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.2321532964706421,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0293,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6825396825396826,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6323529411764706,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9015873015873016,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8711656441717791,
"eval_PERSON_recall": 0.9342105263157895,
"eval_QUANTITY_f1": 0.8059701492537312,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7297297297297297,
"eval_QUANTITY_recall": 0.9,
"eval_TIME_f1": 0.8387096774193549,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7878787878787878,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.20541173219680786,
"eval_overall_accuracy": 0.9603072983354674,
"eval_overall_f1": 0.8435754189944134,
"eval_overall_precision": 0.798941798941799,
"eval_overall_recall": 0.893491124260355,
"eval_runtime": 0.3355,
"eval_samples_per_second": 557.322,
"eval_steps_per_second": 8.941,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 2.329578399658203,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0303,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.863013698630137,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6666666666666667,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6176470588235294,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.8980891719745223,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8703703703703703,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.746268656716418,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.20924483239650726,
"eval_overall_accuracy": 0.9582586427656851,
"eval_overall_f1": 0.8240223463687152,
"eval_overall_precision": 0.7804232804232805,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.3356,
"eval_samples_per_second": 557.229,
"eval_steps_per_second": 8.939,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 0.4096578359603882,
"learning_rate": 1.25e-05,
"loss": 0.0319,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6829268292682927,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6461538461538462,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.89171974522293,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7384615384615385,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.21165302395820618,
"eval_overall_accuracy": 0.9567221510883482,
"eval_overall_f1": 0.8230337078651686,
"eval_overall_precision": 0.7834224598930482,
"eval_overall_recall": 0.8668639053254438,
"eval_runtime": 0.3352,
"eval_samples_per_second": 557.866,
"eval_steps_per_second": 8.95,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.22333945333957672,
"learning_rate": 1.2e-05,
"loss": 0.0294,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.863013698630137,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6829268292682927,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6461538461538462,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.8974358974358975,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.746268656716418,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.20302210748195648,
"eval_overall_accuracy": 0.9577464788732394,
"eval_overall_f1": 0.8258426966292135,
"eval_overall_precision": 0.786096256684492,
"eval_overall_recall": 0.8698224852071006,
"eval_runtime": 0.3339,
"eval_samples_per_second": 560.02,
"eval_steps_per_second": 8.984,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 0.893441915512085,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0282,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6721311475409836,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.640625,
"eval_ORGANIZATION_recall": 0.7068965517241379,
"eval_PERSON_f1": 0.89171974522293,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.7936507936507937,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7352941176470589,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.20604942739009857,
"eval_overall_accuracy": 0.9585147247119078,
"eval_overall_f1": 0.829817158931083,
"eval_overall_precision": 0.7908847184986595,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.3381,
"eval_samples_per_second": 553.156,
"eval_steps_per_second": 8.874,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 1.8298670053482056,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0298,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6610169491525424,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.65,
"eval_ORGANIZATION_recall": 0.6724137931034483,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7272727272727272,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7741935483870968,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8275862068965517,
"eval_loss": 0.20402812957763672,
"eval_overall_accuracy": 0.9585147247119078,
"eval_overall_f1": 0.8238636363636365,
"eval_overall_precision": 0.7923497267759563,
"eval_overall_recall": 0.8579881656804734,
"eval_runtime": 0.3363,
"eval_samples_per_second": 556.081,
"eval_steps_per_second": 8.921,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.38677918910980225,
"learning_rate": 1.05e-05,
"loss": 0.0296,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.882758620689655,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8421052631578947,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6991869918699186,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6615384615384615,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.9009584664536742,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8757763975155279,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7878787878787877,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.1978691667318344,
"eval_overall_accuracy": 0.9608194622279129,
"eval_overall_f1": 0.8474576271186441,
"eval_overall_precision": 0.8108108108108109,
"eval_overall_recall": 0.8875739644970414,
"eval_runtime": 0.3358,
"eval_samples_per_second": 556.894,
"eval_steps_per_second": 8.934,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.18261797726154327,
"learning_rate": 1e-05,
"loss": 0.0281,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.882758620689655,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8421052631578947,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7107438016528926,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6825396825396826,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2115841805934906,
"eval_overall_accuracy": 0.9580025608194622,
"eval_overall_f1": 0.8389830508474576,
"eval_overall_precision": 0.8027027027027027,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.3347,
"eval_samples_per_second": 558.764,
"eval_steps_per_second": 8.964,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 0.5827004909515381,
"learning_rate": 9.5e-06,
"loss": 0.0285,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6721311475409836,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.640625,
"eval_ORGANIZATION_recall": 0.7068965517241379,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7272727272727272,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7692307692307692,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6944444444444444,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.20784814655780792,
"eval_overall_accuracy": 0.9569782330345711,
"eval_overall_f1": 0.8258426966292135,
"eval_overall_precision": 0.786096256684492,
"eval_overall_recall": 0.8698224852071006,
"eval_runtime": 0.3341,
"eval_samples_per_second": 559.746,
"eval_steps_per_second": 8.98,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 0.163285493850708,
"learning_rate": 9e-06,
"loss": 0.0248,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6612903225806452,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6212121212121212,
"eval_ORGANIZATION_recall": 0.7068965517241379,
"eval_PERSON_f1": 0.888888888888889,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7692307692307692,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7352941176470588,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6410256410256411,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.22002604603767395,
"eval_overall_accuracy": 0.9541613316261204,
"eval_overall_f1": 0.8200836820083682,
"eval_overall_precision": 0.7757255936675461,
"eval_overall_recall": 0.8698224852071006,
"eval_runtime": 0.3337,
"eval_samples_per_second": 560.445,
"eval_steps_per_second": 8.991,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 0.5999857783317566,
"learning_rate": 8.500000000000002e-06,
"loss": 0.026,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.888888888888889,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6666666666666667,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6451612903225806,
"eval_ORGANIZATION_recall": 0.6896551724137931,
"eval_PERSON_f1": 0.8974358974358975,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7692307692307692,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8524590163934426,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.8125,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.20526228845119476,
"eval_overall_accuracy": 0.9590268886043534,
"eval_overall_f1": 0.8404558404558404,
"eval_overall_precision": 0.8104395604395604,
"eval_overall_recall": 0.8727810650887574,
"eval_runtime": 0.3329,
"eval_samples_per_second": 561.768,
"eval_steps_per_second": 9.012,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 0.8914698362350464,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0267,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6829268292682927,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6461538461538462,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.8980891719745223,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8703703703703703,
"eval_PERSON_recall": 0.9276315789473685,
"eval_QUANTITY_f1": 0.7692307692307692,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7222222222222222,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.20852600038051605,
"eval_overall_accuracy": 0.9585147247119078,
"eval_overall_f1": 0.8359046283309958,
"eval_overall_precision": 0.7946666666666666,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3353,
"eval_samples_per_second": 557.656,
"eval_steps_per_second": 8.946,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.07933935523033142,
"learning_rate": 7.5e-06,
"loss": 0.0256,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6774193548387097,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.89171974522293,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7878787878787877,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7222222222222222,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.21233612298965454,
"eval_overall_accuracy": 0.9582586427656851,
"eval_overall_f1": 0.8335664335664336,
"eval_overall_precision": 0.7904509283819628,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3363,
"eval_samples_per_second": 556.087,
"eval_steps_per_second": 8.921,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 1.2923147678375244,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0258,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.7,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6774193548387096,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7575757575757577,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7692307692307692,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6944444444444444,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.20847661793231964,
"eval_overall_accuracy": 0.9572343149807938,
"eval_overall_f1": 0.8338028169014083,
"eval_overall_precision": 0.7956989247311828,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.3331,
"eval_samples_per_second": 561.331,
"eval_steps_per_second": 9.005,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.8602144718170166,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0278,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6984126984126984,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.7586206896551724,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.7575757575757576,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6756756756756757,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.2143712192773819,
"eval_overall_accuracy": 0.9582586427656851,
"eval_overall_f1": 0.829608938547486,
"eval_overall_precision": 0.7857142857142857,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.3343,
"eval_samples_per_second": 559.33,
"eval_steps_per_second": 8.973,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 3.9535341262817383,
"learning_rate": 6e-06,
"loss": 0.0266,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.672,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6268656716417911,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7384615384615385,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6857142857142857,
"eval_QUANTITY_recall": 0.8,
"eval_TIME_f1": 0.8253968253968255,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.21172450482845306,
"eval_overall_accuracy": 0.9585147247119078,
"eval_overall_f1": 0.8314606741573034,
"eval_overall_precision": 0.7914438502673797,
"eval_overall_recall": 0.8757396449704142,
"eval_runtime": 0.3355,
"eval_samples_per_second": 557.315,
"eval_steps_per_second": 8.941,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 0.6084784865379333,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0277,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.882758620689655,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8421052631578947,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6774193548387097,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.89171974522293,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7222222222222222,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.21649378538131714,
"eval_overall_accuracy": 0.9574903969270167,
"eval_overall_f1": 0.8335664335664336,
"eval_overall_precision": 0.7904509283819628,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3329,
"eval_samples_per_second": 561.77,
"eval_steps_per_second": 9.012,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 3.59494686126709,
"learning_rate": 5e-06,
"loss": 0.0263,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6935483870967741,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6515151515151515,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.888888888888889,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.746268656716418,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.7692307692307692,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.6944444444444444,
"eval_TIME_recall": 0.8620689655172413,
"eval_loss": 0.21574969589710236,
"eval_overall_accuracy": 0.9572343149807938,
"eval_overall_f1": 0.8284518828451882,
"eval_overall_precision": 0.783641160949868,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.336,
"eval_samples_per_second": 556.623,
"eval_steps_per_second": 8.93,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.6815735697746277,
"learning_rate": 4.5e-06,
"loss": 0.0249,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.8767123287671235,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8311688311688312,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6666666666666666,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6307692307692307,
"eval_ORGANIZATION_recall": 0.7068965517241379,
"eval_PERSON_f1": 0.89171974522293,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.8,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7428571428571429,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.21547271311283112,
"eval_overall_accuracy": 0.9574903969270167,
"eval_overall_f1": 0.8342696629213484,
"eval_overall_precision": 0.7941176470588235,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.3337,
"eval_samples_per_second": 560.443,
"eval_steps_per_second": 8.991,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 0.9203242063522339,
"learning_rate": 4.000000000000001e-06,
"loss": 0.026,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.8689655172413793,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8289473684210527,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.688,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6417910447761194,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7575757575757577,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6944444444444444,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8253968253968255,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.21566654741764069,
"eval_overall_accuracy": 0.9580025608194622,
"eval_overall_f1": 0.8342696629213484,
"eval_overall_precision": 0.7941176470588235,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.3342,
"eval_samples_per_second": 559.523,
"eval_steps_per_second": 8.976,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 1.3422565460205078,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0246,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.863013698630137,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6935483870967741,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6515151515151515,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.746268656716418,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.6756756756756757,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.21777355670928955,
"eval_overall_accuracy": 0.9574903969270167,
"eval_overall_f1": 0.8319327731092437,
"eval_overall_precision": 0.7898936170212766,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.3325,
"eval_samples_per_second": 562.463,
"eval_steps_per_second": 9.023,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.5304462909698486,
"learning_rate": 3e-06,
"loss": 0.0228,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.863013698630137,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6666666666666667,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6056338028169014,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7878787878787877,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.21389849483966827,
"eval_overall_accuracy": 0.9577464788732394,
"eval_overall_f1": 0.83008356545961,
"eval_overall_precision": 0.7842105263157895,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3334,
"eval_samples_per_second": 560.952,
"eval_steps_per_second": 8.999,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 0.9430941343307495,
"learning_rate": 2.5e-06,
"loss": 0.0239,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.863013698630137,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8181818181818182,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.688,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6417910447761194,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7878787878787877,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8253968253968255,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2171957641839981,
"eval_overall_accuracy": 0.9580025608194622,
"eval_overall_f1": 0.8359046283309958,
"eval_overall_precision": 0.7946666666666666,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3342,
"eval_samples_per_second": 559.517,
"eval_steps_per_second": 8.976,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.5671630501747131,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0246,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.882758620689655,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8421052631578947,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6771653543307088,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6231884057971014,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7761194029850748,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7027027027027027,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.21604588627815247,
"eval_overall_accuracy": 0.9585147247119078,
"eval_overall_f1": 0.835195530726257,
"eval_overall_precision": 0.791005291005291,
"eval_overall_recall": 0.8846153846153846,
"eval_runtime": 0.3336,
"eval_samples_per_second": 560.484,
"eval_steps_per_second": 8.992,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 2.1864192485809326,
"learning_rate": 1.5e-06,
"loss": 0.0263,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.888888888888889,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.8533333333333334,
"eval_LOCATION_recall": 0.927536231884058,
"eval_ORGANIZATION_f1": 0.6829268292682927,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6461538461538462,
"eval_ORGANIZATION_recall": 0.7241379310344828,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7692307692307692,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7142857142857143,
"eval_QUANTITY_recall": 0.8333333333333334,
"eval_TIME_f1": 0.8253968253968255,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7647058823529411,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2144096940755844,
"eval_overall_accuracy": 0.9585147247119078,
"eval_overall_f1": 0.8389830508474576,
"eval_overall_precision": 0.8027027027027027,
"eval_overall_recall": 0.878698224852071,
"eval_runtime": 0.3344,
"eval_samples_per_second": 559.208,
"eval_steps_per_second": 8.971,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 0.35259944200515747,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0243,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.8749999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.84,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.688,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6417910447761194,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7878787878787877,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.21475861966609955,
"eval_overall_accuracy": 0.9582586427656851,
"eval_overall_f1": 0.8370786516853933,
"eval_overall_precision": 0.7967914438502673,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.3334,
"eval_samples_per_second": 560.934,
"eval_steps_per_second": 8.999,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 1.3611903190612793,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0232,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.8749999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.84,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6935483870967741,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6515151515151515,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7878787878787877,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.2144315391778946,
"eval_overall_accuracy": 0.9580025608194622,
"eval_overall_f1": 0.8382559774964837,
"eval_overall_precision": 0.7989276139410187,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.334,
"eval_samples_per_second": 559.885,
"eval_steps_per_second": 8.982,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.2549450397491455,
"learning_rate": 0.0,
"loss": 0.0224,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.8749999999999999,
"eval_LOCATION_number": 69,
"eval_LOCATION_precision": 0.84,
"eval_LOCATION_recall": 0.9130434782608695,
"eval_ORGANIZATION_f1": 0.6935483870967741,
"eval_ORGANIZATION_number": 58,
"eval_ORGANIZATION_precision": 0.6515151515151515,
"eval_ORGANIZATION_recall": 0.7413793103448276,
"eval_PERSON_f1": 0.8945686900958467,
"eval_PERSON_number": 152,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9210526315789473,
"eval_QUANTITY_f1": 0.7878787878787877,
"eval_QUANTITY_number": 30,
"eval_QUANTITY_precision": 0.7222222222222222,
"eval_QUANTITY_recall": 0.8666666666666667,
"eval_TIME_f1": 0.8125,
"eval_TIME_number": 29,
"eval_TIME_precision": 0.7428571428571429,
"eval_TIME_recall": 0.896551724137931,
"eval_loss": 0.21471820771694183,
"eval_overall_accuracy": 0.9580025608194622,
"eval_overall_f1": 0.8382559774964837,
"eval_overall_precision": 0.7989276139410187,
"eval_overall_recall": 0.8816568047337278,
"eval_runtime": 0.336,
"eval_samples_per_second": 556.48,
"eval_steps_per_second": 8.927,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 5008141811675874.0,
"train_loss": 0.0706503679617396,
"train_runtime": 608.9849,
"train_samples_per_second": 277.018,
"train_steps_per_second": 17.406
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 5008141811675874.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}