nerugm-pt-pl5-3 / trainer_state.json
apwic's picture
End of training
caaac5f verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 100.0,
"eval_steps": 500,
"global_step": 10600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 2.6862921714782715,
"learning_rate": 4.9500000000000004e-05,
"loss": 0.9792,
"step": 106
},
{
"epoch": 1.0,
"eval_LOCATION_f1": 0.0,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.0,
"eval_LOCATION_recall": 0.0,
"eval_ORGANIZATION_f1": 0.0,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.0,
"eval_ORGANIZATION_recall": 0.0,
"eval_PERSON_f1": 0.18095238095238095,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.31666666666666665,
"eval_PERSON_recall": 0.12666666666666668,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.06666666666666667,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.5,
"eval_TIME_recall": 0.03571428571428571,
"eval_loss": 0.5512092113494873,
"eval_overall_accuracy": 0.850387972841901,
"eval_overall_f1": 0.09501187648456057,
"eval_overall_precision": 0.2702702702702703,
"eval_overall_recall": 0.05763688760806916,
"eval_runtime": 0.3324,
"eval_samples_per_second": 562.651,
"eval_steps_per_second": 9.026,
"step": 106
},
{
"epoch": 2.0,
"grad_norm": 1.0679957866668701,
"learning_rate": 4.9e-05,
"loss": 0.4837,
"step": 212
},
{
"epoch": 2.0,
"eval_LOCATION_f1": 0.41739130434782606,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.5454545454545454,
"eval_LOCATION_recall": 0.3380281690140845,
"eval_ORGANIZATION_f1": 0.019801980198019802,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.027777777777777776,
"eval_ORGANIZATION_recall": 0.015384615384615385,
"eval_PERSON_f1": 0.6831955922865013,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.5821596244131455,
"eval_PERSON_recall": 0.8266666666666667,
"eval_QUANTITY_f1": 0.0,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.0,
"eval_QUANTITY_recall": 0.0,
"eval_TIME_f1": 0.5454545454545454,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.47368421052631576,
"eval_TIME_recall": 0.6428571428571429,
"eval_loss": 0.33068543672561646,
"eval_overall_accuracy": 0.9022793404461688,
"eval_overall_f1": 0.4798850574712644,
"eval_overall_precision": 0.4785100286532951,
"eval_overall_recall": 0.4812680115273775,
"eval_runtime": 0.3251,
"eval_samples_per_second": 575.209,
"eval_steps_per_second": 9.228,
"step": 212
},
{
"epoch": 3.0,
"grad_norm": 0.8312263488769531,
"learning_rate": 4.85e-05,
"loss": 0.3133,
"step": 318
},
{
"epoch": 3.0,
"eval_LOCATION_f1": 0.5306122448979592,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.5131578947368421,
"eval_LOCATION_recall": 0.5492957746478874,
"eval_ORGANIZATION_f1": 0.4000000000000001,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.34444444444444444,
"eval_ORGANIZATION_recall": 0.47692307692307695,
"eval_PERSON_f1": 0.7710843373493976,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7032967032967034,
"eval_PERSON_recall": 0.8533333333333334,
"eval_QUANTITY_f1": 0.5194805194805195,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.45454545454545453,
"eval_QUANTITY_recall": 0.6060606060606061,
"eval_TIME_f1": 0.793103448275862,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7666666666666667,
"eval_TIME_recall": 0.8214285714285714,
"eval_loss": 0.21400973200798035,
"eval_overall_accuracy": 0.9308923375363725,
"eval_overall_f1": 0.6267880364109232,
"eval_overall_precision": 0.5710900473933649,
"eval_overall_recall": 0.6945244956772334,
"eval_runtime": 0.3261,
"eval_samples_per_second": 573.482,
"eval_steps_per_second": 9.2,
"step": 318
},
{
"epoch": 4.0,
"grad_norm": 1.0169802904129028,
"learning_rate": 4.8e-05,
"loss": 0.2327,
"step": 424
},
{
"epoch": 4.0,
"eval_LOCATION_f1": 0.6436781609195402,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.5436893203883495,
"eval_LOCATION_recall": 0.7887323943661971,
"eval_ORGANIZATION_f1": 0.5590062111801243,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.46875,
"eval_ORGANIZATION_recall": 0.6923076923076923,
"eval_PERSON_f1": 0.8421052631578947,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.7861271676300579,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.5897435897435898,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5111111111111111,
"eval_QUANTITY_recall": 0.696969696969697,
"eval_TIME_f1": 0.7719298245614034,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7586206896551724,
"eval_TIME_recall": 0.7857142857142857,
"eval_loss": 0.17442111670970917,
"eval_overall_accuracy": 0.9408341416100873,
"eval_overall_f1": 0.7112232030264818,
"eval_overall_precision": 0.6322869955156951,
"eval_overall_recall": 0.8126801152737753,
"eval_runtime": 0.3287,
"eval_samples_per_second": 568.904,
"eval_steps_per_second": 9.127,
"step": 424
},
{
"epoch": 5.0,
"grad_norm": 1.3268284797668457,
"learning_rate": 4.75e-05,
"loss": 0.1989,
"step": 530
},
{
"epoch": 5.0,
"eval_LOCATION_f1": 0.7215189873417721,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6551724137931034,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.6493506493506495,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5617977528089888,
"eval_ORGANIZATION_recall": 0.7692307692307693,
"eval_PERSON_f1": 0.8652037617554857,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8165680473372781,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6329113924050633,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5434782608695652,
"eval_QUANTITY_recall": 0.7575757575757576,
"eval_TIME_f1": 0.7796610169491526,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7419354838709677,
"eval_TIME_recall": 0.8214285714285714,
"eval_loss": 0.1507454365491867,
"eval_overall_accuracy": 0.9481086323957323,
"eval_overall_f1": 0.7620286085825748,
"eval_overall_precision": 0.6943127962085308,
"eval_overall_recall": 0.8443804034582133,
"eval_runtime": 0.3267,
"eval_samples_per_second": 572.456,
"eval_steps_per_second": 9.184,
"step": 530
},
{
"epoch": 6.0,
"grad_norm": 1.4492706060409546,
"learning_rate": 4.7e-05,
"loss": 0.1782,
"step": 636
},
{
"epoch": 6.0,
"eval_LOCATION_f1": 0.7088607594936709,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6436781609195402,
"eval_LOCATION_recall": 0.7887323943661971,
"eval_ORGANIZATION_f1": 0.6473988439306357,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5185185185185185,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8598130841121495,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8070175438596491,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.6352941176470589,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5192307692307693,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.746268656716418,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6410256410256411,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.17294442653656006,
"eval_overall_accuracy": 0.9425315227934045,
"eval_overall_f1": 0.7512437810945274,
"eval_overall_precision": 0.6608315098468271,
"eval_overall_recall": 0.8703170028818443,
"eval_runtime": 0.327,
"eval_samples_per_second": 571.852,
"eval_steps_per_second": 9.174,
"step": 636
},
{
"epoch": 7.0,
"grad_norm": 2.372952938079834,
"learning_rate": 4.6500000000000005e-05,
"loss": 0.1675,
"step": 742
},
{
"epoch": 7.0,
"eval_LOCATION_f1": 0.7407407407407407,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6593406593406593,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.675,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5684210526315789,
"eval_ORGANIZATION_recall": 0.8307692307692308,
"eval_PERSON_f1": 0.8706624605678233,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8263473053892215,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7179487179487178,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6222222222222222,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1436489075422287,
"eval_overall_accuracy": 0.950533462657614,
"eval_overall_f1": 0.7784891165172856,
"eval_overall_precision": 0.7004608294930875,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3264,
"eval_samples_per_second": 572.836,
"eval_steps_per_second": 9.19,
"step": 742
},
{
"epoch": 8.0,
"grad_norm": 0.5531976222991943,
"learning_rate": 4.600000000000001e-05,
"loss": 0.1523,
"step": 848
},
{
"epoch": 8.0,
"eval_LOCATION_f1": 0.7643312101910827,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6976744186046512,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.6832298136645962,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5729166666666666,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8670886075949367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8253012048192772,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.736842105263158,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6511627906976745,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7936507936507937,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7142857142857143,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1423933058977127,
"eval_overall_accuracy": 0.9527158098933075,
"eval_overall_f1": 0.7891332470892625,
"eval_overall_precision": 0.715962441314554,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3281,
"eval_samples_per_second": 570.034,
"eval_steps_per_second": 9.145,
"step": 848
},
{
"epoch": 9.0,
"grad_norm": 1.0425461530685425,
"learning_rate": 4.55e-05,
"loss": 0.148,
"step": 954
},
{
"epoch": 9.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7466666666666668,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6588235294117647,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8690095846645367,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8343558282208589,
"eval_PERSON_recall": 0.9066666666666666,
"eval_QUANTITY_f1": 0.6666666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5777777777777777,
"eval_QUANTITY_recall": 0.7878787878787878,
"eval_TIME_f1": 0.7868852459016394,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13000667095184326,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.8015873015873015,
"eval_overall_precision": 0.7408312958435208,
"eval_overall_recall": 0.8731988472622478,
"eval_runtime": 0.3275,
"eval_samples_per_second": 571.032,
"eval_steps_per_second": 9.161,
"step": 954
},
{
"epoch": 10.0,
"grad_norm": 0.9898656606674194,
"learning_rate": 4.5e-05,
"loss": 0.1376,
"step": 1060
},
{
"epoch": 10.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7320261437908497,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6363636363636364,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.888178913738019,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.852760736196319,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7088607594936709,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6086956521739131,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.12935131788253784,
"eval_overall_accuracy": 0.9568380213385063,
"eval_overall_f1": 0.8131578947368422,
"eval_overall_precision": 0.7481840193704601,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3271,
"eval_samples_per_second": 571.762,
"eval_steps_per_second": 9.173,
"step": 1060
},
{
"epoch": 11.0,
"grad_norm": 1.2879328727722168,
"learning_rate": 4.4500000000000004e-05,
"loss": 0.1378,
"step": 1166
},
{
"epoch": 11.0,
"eval_LOCATION_f1": 0.7532467532467533,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6987951807228916,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.728476821192053,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6395348837209303,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.888178913738019,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.852760736196319,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7741935483870968,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.12860190868377686,
"eval_overall_accuracy": 0.9565955383123181,
"eval_overall_f1": 0.8063660477453581,
"eval_overall_precision": 0.7469287469287469,
"eval_overall_recall": 0.8760806916426513,
"eval_runtime": 0.3281,
"eval_samples_per_second": 570.029,
"eval_steps_per_second": 9.145,
"step": 1166
},
{
"epoch": 12.0,
"grad_norm": 1.0456236600875854,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.1279,
"step": 1272
},
{
"epoch": 12.0,
"eval_LOCATION_f1": 0.728395061728395,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6483516483516484,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7375,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6210526315789474,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8974358974358974,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.736842105263158,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6511627906976745,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.6865671641791046,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.5897435897435898,
"eval_TIME_recall": 0.8214285714285714,
"eval_loss": 0.14702975749969482,
"eval_overall_accuracy": 0.9524733268671193,
"eval_overall_f1": 0.7953667953667953,
"eval_overall_precision": 0.7186046511627907,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.329,
"eval_samples_per_second": 568.322,
"eval_steps_per_second": 9.117,
"step": 1272
},
{
"epoch": 13.0,
"grad_norm": 0.7470729351043701,
"learning_rate": 4.35e-05,
"loss": 0.1257,
"step": 1378
},
{
"epoch": 13.0,
"eval_LOCATION_f1": 0.7763157894736843,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8917197452229298,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8070175438596492,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7931034482758621,
"eval_TIME_recall": 0.8214285714285714,
"eval_loss": 0.12572742998600006,
"eval_overall_accuracy": 0.9597478176527643,
"eval_overall_f1": 0.823529411764706,
"eval_overall_precision": 0.7680798004987531,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.326,
"eval_samples_per_second": 573.579,
"eval_steps_per_second": 9.202,
"step": 1378
},
{
"epoch": 14.0,
"grad_norm": 1.587265133857727,
"learning_rate": 4.3e-05,
"loss": 0.1211,
"step": 1484
},
{
"epoch": 14.0,
"eval_LOCATION_f1": 0.7643312101910827,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6976744186046512,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7712418300653594,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6704545454545454,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8753993610223643,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8404907975460123,
"eval_PERSON_recall": 0.9133333333333333,
"eval_QUANTITY_f1": 0.7466666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.6956521739130435,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.5853658536585366,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.12821051478385925,
"eval_overall_accuracy": 0.9565955383123181,
"eval_overall_f1": 0.8031290743155148,
"eval_overall_precision": 0.7333333333333333,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3277,
"eval_samples_per_second": 570.653,
"eval_steps_per_second": 9.155,
"step": 1484
},
{
"epoch": 15.0,
"grad_norm": 1.1898987293243408,
"learning_rate": 4.25e-05,
"loss": 0.1182,
"step": 1590
},
{
"epoch": 15.0,
"eval_LOCATION_f1": 0.794701986754967,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7532467532467532,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.651685393258427,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.12380851060152054,
"eval_overall_accuracy": 0.960717749757517,
"eval_overall_f1": 0.8255659121171772,
"eval_overall_precision": 0.7673267326732673,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3297,
"eval_samples_per_second": 567.219,
"eval_steps_per_second": 9.1,
"step": 1590
},
{
"epoch": 16.0,
"grad_norm": 1.2394359111785889,
"learning_rate": 4.2e-05,
"loss": 0.1084,
"step": 1696
},
{
"epoch": 16.0,
"eval_LOCATION_f1": 0.7733333333333333,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7341772151898734,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7712418300653594,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6704545454545454,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.888178913738019,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.852760736196319,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7466666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7741935483870968,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7058823529411765,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.12522907555103302,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.8180610889774237,
"eval_overall_precision": 0.7586206896551724,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3284,
"eval_samples_per_second": 569.484,
"eval_steps_per_second": 9.136,
"step": 1696
},
{
"epoch": 17.0,
"grad_norm": 0.5448505878448486,
"learning_rate": 4.15e-05,
"loss": 0.11,
"step": 1802
},
{
"epoch": 17.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7428571428571429,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6933333333333334,
"eval_ORGANIZATION_recall": 0.8,
"eval_PERSON_f1": 0.8917197452229298,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7777777777777778,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.717948717948718,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7868852459016394,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.11857786774635315,
"eval_overall_accuracy": 0.962172647914646,
"eval_overall_f1": 0.8243243243243243,
"eval_overall_precision": 0.7760814249363868,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3269,
"eval_samples_per_second": 572.103,
"eval_steps_per_second": 9.178,
"step": 1802
},
{
"epoch": 18.0,
"grad_norm": 0.928116500377655,
"learning_rate": 4.1e-05,
"loss": 0.105,
"step": 1908
},
{
"epoch": 18.0,
"eval_LOCATION_f1": 0.7843137254901961,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7402597402597403,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6404494382022472,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.90032154340836,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.736842105263158,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6511627906976745,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.75,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6666666666666666,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13439632952213287,
"eval_overall_accuracy": 0.9568380213385063,
"eval_overall_f1": 0.8153034300791556,
"eval_overall_precision": 0.7518248175182481,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3276,
"eval_samples_per_second": 570.855,
"eval_steps_per_second": 9.158,
"step": 1908
},
{
"epoch": 19.0,
"grad_norm": 0.6120880246162415,
"learning_rate": 4.05e-05,
"loss": 0.1012,
"step": 2014
},
{
"epoch": 19.0,
"eval_LOCATION_f1": 0.778523489932886,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7435897435897436,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.76,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6705882352941176,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.8000000000000002,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7567567567567568,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1134907528758049,
"eval_overall_accuracy": 0.9643549951503395,
"eval_overall_f1": 0.8299319727891157,
"eval_overall_precision": 0.7860824742268041,
"eval_overall_recall": 0.8789625360230547,
"eval_runtime": 0.3267,
"eval_samples_per_second": 572.422,
"eval_steps_per_second": 9.183,
"step": 2014
},
{
"epoch": 20.0,
"grad_norm": 0.7189091444015503,
"learning_rate": 4e-05,
"loss": 0.1009,
"step": 2120
},
{
"epoch": 20.0,
"eval_LOCATION_f1": 0.8129032258064516,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.75,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.763888888888889,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6962025316455697,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.887459807073955,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8571428571428571,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.11710327118635178,
"eval_overall_accuracy": 0.9636275460717749,
"eval_overall_f1": 0.8324324324324324,
"eval_overall_precision": 0.7837150127226463,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3264,
"eval_samples_per_second": 572.982,
"eval_steps_per_second": 9.192,
"step": 2120
},
{
"epoch": 21.0,
"grad_norm": 1.2998398542404175,
"learning_rate": 3.9500000000000005e-05,
"loss": 0.0994,
"step": 2226
},
{
"epoch": 21.0,
"eval_LOCATION_f1": 0.7777777777777779,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6923076923076923,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7972027972027972,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7307692307692307,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9038461538461539,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8703703703703703,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5957446808510638,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1276998519897461,
"eval_overall_accuracy": 0.9597478176527643,
"eval_overall_f1": 0.8295904887714662,
"eval_overall_precision": 0.7658536585365854,
"eval_overall_recall": 0.9048991354466859,
"eval_runtime": 0.3284,
"eval_samples_per_second": 569.448,
"eval_steps_per_second": 9.136,
"step": 2226
},
{
"epoch": 22.0,
"grad_norm": 0.8688408136367798,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.0947,
"step": 2332
},
{
"epoch": 22.0,
"eval_LOCATION_f1": 0.7530864197530862,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6703296703296703,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.759493670886076,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6451612903225806,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.90032154340836,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.6829268292682927,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5714285714285714,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7619047619047619,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6857142857142857,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14317628741264343,
"eval_overall_accuracy": 0.9536857419980601,
"eval_overall_f1": 0.8067010309278351,
"eval_overall_precision": 0.7296037296037297,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3269,
"eval_samples_per_second": 571.972,
"eval_steps_per_second": 9.176,
"step": 2332
},
{
"epoch": 23.0,
"grad_norm": 1.058230996131897,
"learning_rate": 3.85e-05,
"loss": 0.0922,
"step": 2438
},
{
"epoch": 23.0,
"eval_LOCATION_f1": 0.8025477707006369,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7325581395348837,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7712418300653594,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6704545454545454,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.90032154340836,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8000000000000002,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7567567567567568,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.11902488023042679,
"eval_overall_accuracy": 0.9643549951503395,
"eval_overall_f1": 0.84,
"eval_overall_precision": 0.7816377171215881,
"eval_overall_recall": 0.9077809798270894,
"eval_runtime": 0.3269,
"eval_samples_per_second": 572.066,
"eval_steps_per_second": 9.178,
"step": 2438
},
{
"epoch": 24.0,
"grad_norm": 1.2606264352798462,
"learning_rate": 3.8e-05,
"loss": 0.0917,
"step": 2544
},
{
"epoch": 24.0,
"eval_LOCATION_f1": 0.7530864197530862,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6703296703296703,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7534246575342466,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6790123456790124,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7777777777777778,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.717948717948718,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13196653127670288,
"eval_overall_accuracy": 0.9587778855480117,
"eval_overall_f1": 0.8186666666666667,
"eval_overall_precision": 0.7617866004962779,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3273,
"eval_samples_per_second": 571.298,
"eval_steps_per_second": 9.165,
"step": 2544
},
{
"epoch": 25.0,
"grad_norm": 0.8119063973426819,
"learning_rate": 3.7500000000000003e-05,
"loss": 0.0895,
"step": 2650
},
{
"epoch": 25.0,
"eval_LOCATION_f1": 0.7625,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6853932584269663,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7755102040816327,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6951219512195121,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.896774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.86875,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7466666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.12873846292495728,
"eval_overall_accuracy": 0.9599903006789525,
"eval_overall_f1": 0.8233731739707836,
"eval_overall_precision": 0.7635467980295566,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3259,
"eval_samples_per_second": 573.763,
"eval_steps_per_second": 9.205,
"step": 2650
},
{
"epoch": 26.0,
"grad_norm": 0.6412087082862854,
"learning_rate": 3.7e-05,
"loss": 0.0915,
"step": 2756
},
{
"epoch": 26.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.759493670886076,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7483870967741936,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6444444444444445,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6363636363636364,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.12941302359104156,
"eval_overall_accuracy": 0.962172647914646,
"eval_overall_f1": 0.8244680851063829,
"eval_overall_precision": 0.7654320987654321,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3264,
"eval_samples_per_second": 572.875,
"eval_steps_per_second": 9.191,
"step": 2756
},
{
"epoch": 27.0,
"grad_norm": 1.1233749389648438,
"learning_rate": 3.65e-05,
"loss": 0.0857,
"step": 2862
},
{
"epoch": 27.0,
"eval_LOCATION_f1": 0.775,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6966292134831461,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7662337662337663,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6629213483146067,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.9067524115755627,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8757763975155279,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.6428571428571428,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.5294117647058824,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.78125,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.6944444444444444,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14580127596855164,
"eval_overall_accuracy": 0.9553831231813773,
"eval_overall_f1": 0.8124191461836998,
"eval_overall_precision": 0.7370892018779343,
"eval_overall_recall": 0.9048991354466859,
"eval_runtime": 0.3274,
"eval_samples_per_second": 571.119,
"eval_steps_per_second": 9.162,
"step": 2862
},
{
"epoch": 28.0,
"grad_norm": 2.415337085723877,
"learning_rate": 3.6e-05,
"loss": 0.0846,
"step": 2968
},
{
"epoch": 28.0,
"eval_LOCATION_f1": 0.7837837837837838,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7532467532467533,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7763157894736842,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6781609195402298,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.9009584664536742,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8650306748466258,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.12516556680202484,
"eval_overall_accuracy": 0.9636275460717749,
"eval_overall_f1": 0.8337801608579088,
"eval_overall_precision": 0.7794486215538847,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3273,
"eval_samples_per_second": 571.332,
"eval_steps_per_second": 9.166,
"step": 2968
},
{
"epoch": 29.0,
"grad_norm": 0.36568284034729004,
"learning_rate": 3.55e-05,
"loss": 0.0828,
"step": 3074
},
{
"epoch": 29.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7361963190184049,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6122448979591837,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.8974358974358974,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7777777777777778,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.717948717948718,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.12355955690145493,
"eval_overall_accuracy": 0.9614451988360815,
"eval_overall_f1": 0.8289473684210527,
"eval_overall_precision": 0.7627118644067796,
"eval_overall_recall": 0.9077809798270894,
"eval_runtime": 0.3266,
"eval_samples_per_second": 572.645,
"eval_steps_per_second": 9.187,
"step": 3074
},
{
"epoch": 30.0,
"grad_norm": 2.264235019683838,
"learning_rate": 3.5e-05,
"loss": 0.081,
"step": 3180
},
{
"epoch": 30.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7317073170731707,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6060606060606061,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.8974358974358974,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13108646869659424,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8241469816272966,
"eval_overall_precision": 0.7566265060240964,
"eval_overall_recall": 0.9048991354466859,
"eval_runtime": 0.3263,
"eval_samples_per_second": 573.006,
"eval_steps_per_second": 9.193,
"step": 3180
},
{
"epoch": 31.0,
"grad_norm": 0.646797239780426,
"learning_rate": 3.45e-05,
"loss": 0.0782,
"step": 3286
},
{
"epoch": 31.0,
"eval_LOCATION_f1": 0.7530864197530862,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6703296703296703,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7532467532467532,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.651685393258427,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7466666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13420291244983673,
"eval_overall_accuracy": 0.9599903006789525,
"eval_overall_f1": 0.8167539267015707,
"eval_overall_precision": 0.7482014388489209,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.327,
"eval_samples_per_second": 571.836,
"eval_steps_per_second": 9.174,
"step": 3286
},
{
"epoch": 32.0,
"grad_norm": 0.6615414023399353,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.0812,
"step": 3392
},
{
"epoch": 32.0,
"eval_LOCATION_f1": 0.751592356687898,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.686046511627907,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7483870967741936,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6444444444444445,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.12814216315746307,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8174603174603176,
"eval_overall_precision": 0.7555012224938875,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.327,
"eval_samples_per_second": 571.795,
"eval_steps_per_second": 9.173,
"step": 3392
},
{
"epoch": 33.0,
"grad_norm": 1.0747178792953491,
"learning_rate": 3.35e-05,
"loss": 0.0759,
"step": 3498
},
{
"epoch": 33.0,
"eval_LOCATION_f1": 0.7612903225806451,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7023809523809523,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.782051282051282,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6703296703296703,
"eval_ORGANIZATION_recall": 0.9384615384615385,
"eval_PERSON_f1": 0.8974358974358974,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.7868852459016394,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.12921784818172455,
"eval_overall_accuracy": 0.9609602327837051,
"eval_overall_f1": 0.8269484808454426,
"eval_overall_precision": 0.7634146341463415,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3274,
"eval_samples_per_second": 571.082,
"eval_steps_per_second": 9.162,
"step": 3498
},
{
"epoch": 34.0,
"grad_norm": 0.9548816084861755,
"learning_rate": 3.3e-05,
"loss": 0.0755,
"step": 3604
},
{
"epoch": 34.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7916666666666667,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7215189873417721,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7466666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7868852459016394,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.12423999607563019,
"eval_overall_accuracy": 0.9614451988360815,
"eval_overall_f1": 0.8279569892473119,
"eval_overall_precision": 0.7758186397984886,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3276,
"eval_samples_per_second": 570.793,
"eval_steps_per_second": 9.157,
"step": 3604
},
{
"epoch": 35.0,
"grad_norm": 0.42714256048202515,
"learning_rate": 3.2500000000000004e-05,
"loss": 0.0739,
"step": 3710
},
{
"epoch": 35.0,
"eval_LOCATION_f1": 0.751592356687898,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.686046511627907,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7453416149068324,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.625,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.8974358974358974,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.7868852459016394,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7272727272727273,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.13675132393836975,
"eval_overall_accuracy": 0.9568380213385063,
"eval_overall_f1": 0.8141361256544503,
"eval_overall_precision": 0.7458033573141487,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3266,
"eval_samples_per_second": 572.553,
"eval_steps_per_second": 9.185,
"step": 3710
},
{
"epoch": 36.0,
"grad_norm": 1.520427942276001,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.0754,
"step": 3816
},
{
"epoch": 36.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7672955974842768,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.648936170212766,
"eval_ORGANIZATION_recall": 0.9384615384615385,
"eval_PERSON_f1": 0.90032154340836,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1319383829832077,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.8289473684210527,
"eval_overall_precision": 0.7627118644067796,
"eval_overall_recall": 0.9077809798270894,
"eval_runtime": 0.3273,
"eval_samples_per_second": 571.333,
"eval_steps_per_second": 9.166,
"step": 3816
},
{
"epoch": 37.0,
"grad_norm": 0.7817038893699646,
"learning_rate": 3.15e-05,
"loss": 0.0703,
"step": 3922
},
{
"epoch": 37.0,
"eval_LOCATION_f1": 0.7530864197530862,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6703296703296703,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7402597402597403,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6404494382022472,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8980891719745222,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8597560975609756,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7012987012987013,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6136363636363636,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1478222757577896,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.8093994778067884,
"eval_overall_precision": 0.7398568019093079,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3267,
"eval_samples_per_second": 572.415,
"eval_steps_per_second": 9.183,
"step": 3922
},
{
"epoch": 38.0,
"grad_norm": 0.6990446448326111,
"learning_rate": 3.1e-05,
"loss": 0.0735,
"step": 4028
},
{
"epoch": 38.0,
"eval_LOCATION_f1": 0.8181818181818181,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7590361445783133,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7516778523489933,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.879746835443038,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8373493975903614,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.806451612903226,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7352941176470589,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.12963485717773438,
"eval_overall_accuracy": 0.9624151309408342,
"eval_overall_f1": 0.8249336870026525,
"eval_overall_precision": 0.7641277641277642,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.327,
"eval_samples_per_second": 571.9,
"eval_steps_per_second": 9.175,
"step": 4028
},
{
"epoch": 39.0,
"grad_norm": 1.1196815967559814,
"learning_rate": 3.05e-05,
"loss": 0.0718,
"step": 4134
},
{
"epoch": 39.0,
"eval_LOCATION_f1": 0.7402597402597403,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6867469879518072,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7375,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6210526315789474,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.9038461538461539,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8703703703703703,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7671232876712328,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13455747067928314,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.8190224570673712,
"eval_overall_precision": 0.7560975609756098,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3273,
"eval_samples_per_second": 571.347,
"eval_steps_per_second": 9.166,
"step": 4134
},
{
"epoch": 40.0,
"grad_norm": 0.904691219329834,
"learning_rate": 3e-05,
"loss": 0.0694,
"step": 4240
},
{
"epoch": 40.0,
"eval_LOCATION_f1": 0.7733333333333333,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7341772151898734,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7333333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6470588235294118,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7733333333333333,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6904761904761905,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.806451612903226,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7352941176470589,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1319706290960312,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8186666666666667,
"eval_overall_precision": 0.7617866004962779,
"eval_overall_recall": 0.8847262247838616,
"eval_runtime": 0.3287,
"eval_samples_per_second": 568.914,
"eval_steps_per_second": 9.127,
"step": 4240
},
{
"epoch": 41.0,
"grad_norm": 0.4921020567417145,
"learning_rate": 2.95e-05,
"loss": 0.0693,
"step": 4346
},
{
"epoch": 41.0,
"eval_LOCATION_f1": 0.7435897435897436,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6823529411764706,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7515923566878981,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6413043478260869,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.912621359223301,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8867924528301887,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7733333333333333,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6904761904761905,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14422298967838287,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8253968253968255,
"eval_overall_precision": 0.7628361858190709,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3268,
"eval_samples_per_second": 572.269,
"eval_steps_per_second": 9.181,
"step": 4346
},
{
"epoch": 42.0,
"grad_norm": 0.17059876024723053,
"learning_rate": 2.9e-05,
"loss": 0.0675,
"step": 4452
},
{
"epoch": 42.0,
"eval_LOCATION_f1": 0.7763157894736843,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7283950617283951,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7866666666666665,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6941176470588235,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7466666666666666,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6666666666666666,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13859502971172333,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.8266666666666667,
"eval_overall_precision": 0.7692307692307693,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3267,
"eval_samples_per_second": 572.428,
"eval_steps_per_second": 9.183,
"step": 4452
},
{
"epoch": 43.0,
"grad_norm": 0.5693849325180054,
"learning_rate": 2.8499999999999998e-05,
"loss": 0.0672,
"step": 4558
},
{
"epoch": 43.0,
"eval_LOCATION_f1": 0.7692307692307694,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7058823529411765,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.806451612903226,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7352941176470589,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13775749504566193,
"eval_overall_accuracy": 0.9590203685741998,
"eval_overall_f1": 0.8243064729194188,
"eval_overall_precision": 0.7609756097560976,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.326,
"eval_samples_per_second": 573.554,
"eval_steps_per_second": 9.201,
"step": 4558
},
{
"epoch": 44.0,
"grad_norm": 0.5870493650436401,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.067,
"step": 4664
},
{
"epoch": 44.0,
"eval_LOCATION_f1": 0.7866666666666666,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7468354430379747,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7712418300653594,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6704545454545454,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8853503184713376,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8475609756097561,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8285714285714285,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7837837837837838,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13134053349494934,
"eval_overall_accuracy": 0.9626576139670223,
"eval_overall_f1": 0.8315508021390374,
"eval_overall_precision": 0.7755610972568578,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.327,
"eval_samples_per_second": 571.903,
"eval_steps_per_second": 9.175,
"step": 4664
},
{
"epoch": 45.0,
"grad_norm": 1.1741827726364136,
"learning_rate": 2.7500000000000004e-05,
"loss": 0.0656,
"step": 4770
},
{
"epoch": 45.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7837837837837838,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6987951807228916,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8974358974358974,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7200000000000001,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6428571428571429,
"eval_QUANTITY_recall": 0.8181818181818182,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13948975503444672,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8320000000000001,
"eval_overall_precision": 0.7741935483870968,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3274,
"eval_samples_per_second": 571.187,
"eval_steps_per_second": 9.163,
"step": 4770
},
{
"epoch": 46.0,
"grad_norm": 0.8152003288269043,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.0656,
"step": 4876
},
{
"epoch": 46.0,
"eval_LOCATION_f1": 0.7662337662337662,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7108433734939759,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7450980392156863,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6477272727272727,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13262593746185303,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8222811671087533,
"eval_overall_precision": 0.7616707616707616,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3275,
"eval_samples_per_second": 571.056,
"eval_steps_per_second": 9.161,
"step": 4876
},
{
"epoch": 47.0,
"grad_norm": 0.9389750361442566,
"learning_rate": 2.6500000000000004e-05,
"loss": 0.062,
"step": 4982
},
{
"epoch": 47.0,
"eval_LOCATION_f1": 0.7421383647798742,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6704545454545454,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7450980392156863,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6477272727272727,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8924050632911392,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8493975903614458,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7567567567567567,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6829268292682927,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.806451612903226,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7352941176470589,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.15109694004058838,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.81151832460733,
"eval_overall_precision": 0.7434052757793765,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3278,
"eval_samples_per_second": 570.556,
"eval_steps_per_second": 9.153,
"step": 4982
},
{
"epoch": 48.0,
"grad_norm": 1.3758347034454346,
"learning_rate": 2.6000000000000002e-05,
"loss": 0.0638,
"step": 5088
},
{
"epoch": 48.0,
"eval_LOCATION_f1": 0.7875000000000001,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7078651685393258,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7516778523489933,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8853503184713376,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8475609756097561,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7733333333333333,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6904761904761905,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1447124034166336,
"eval_overall_accuracy": 0.9597478176527643,
"eval_overall_f1": 0.8221343873517787,
"eval_overall_precision": 0.7572815533980582,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.327,
"eval_samples_per_second": 571.823,
"eval_steps_per_second": 9.174,
"step": 5088
},
{
"epoch": 49.0,
"grad_norm": 0.8612605333328247,
"learning_rate": 2.5500000000000003e-05,
"loss": 0.0601,
"step": 5194
},
{
"epoch": 49.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7567567567567568,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6746987951807228,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8974358974358974,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1353224217891693,
"eval_overall_accuracy": 0.962172647914646,
"eval_overall_f1": 0.8288770053475935,
"eval_overall_precision": 0.773067331670823,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3281,
"eval_samples_per_second": 569.939,
"eval_steps_per_second": 9.143,
"step": 5194
},
{
"epoch": 50.0,
"grad_norm": 1.3004350662231445,
"learning_rate": 2.5e-05,
"loss": 0.0604,
"step": 5300
},
{
"epoch": 50.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7549668874172185,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6627906976744186,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8974358974358974,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1338462084531784,
"eval_overall_accuracy": 0.9619301648884578,
"eval_overall_f1": 0.8315508021390374,
"eval_overall_precision": 0.7755610972568578,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3278,
"eval_samples_per_second": 570.522,
"eval_steps_per_second": 9.153,
"step": 5300
},
{
"epoch": 51.0,
"grad_norm": 0.871790885925293,
"learning_rate": 2.45e-05,
"loss": 0.0582,
"step": 5406
},
{
"epoch": 51.0,
"eval_LOCATION_f1": 0.7654320987654322,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6813186813186813,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7619047619047619,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6829268292682927,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9096774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.88125,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.819672131147541,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7575757575757576,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.13927897810935974,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8302387267904509,
"eval_overall_precision": 0.769041769041769,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3272,
"eval_samples_per_second": 571.49,
"eval_steps_per_second": 9.168,
"step": 5406
},
{
"epoch": 52.0,
"grad_norm": 0.7292200326919556,
"learning_rate": 2.4e-05,
"loss": 0.0608,
"step": 5512
},
{
"epoch": 52.0,
"eval_LOCATION_f1": 0.7631578947368421,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7160493827160493,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7295597484276729,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6170212765957447,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8789808917197452,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8414634146341463,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.1517271101474762,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8153034300791556,
"eval_overall_precision": 0.7518248175182481,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3279,
"eval_samples_per_second": 570.258,
"eval_steps_per_second": 9.149,
"step": 5512
},
{
"epoch": 53.0,
"grad_norm": 0.8021668791770935,
"learning_rate": 2.35e-05,
"loss": 0.0575,
"step": 5618
},
{
"epoch": 53.0,
"eval_LOCATION_f1": 0.7466666666666666,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7088607594936709,
"eval_LOCATION_recall": 0.7887323943661971,
"eval_ORGANIZATION_f1": 0.7361963190184049,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6122448979591837,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.8832807570977917,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8383233532934131,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.15490397810935974,
"eval_overall_accuracy": 0.9556256062075654,
"eval_overall_f1": 0.8125819134993448,
"eval_overall_precision": 0.7451923076923077,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3281,
"eval_samples_per_second": 570.008,
"eval_steps_per_second": 9.145,
"step": 5618
},
{
"epoch": 54.0,
"grad_norm": 1.3401607275009155,
"learning_rate": 2.3000000000000003e-05,
"loss": 0.0585,
"step": 5724
},
{
"epoch": 54.0,
"eval_LOCATION_f1": 0.7402597402597403,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6867469879518072,
"eval_LOCATION_recall": 0.8028169014084507,
"eval_ORGANIZATION_f1": 0.7305389221556887,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.5980392156862745,
"eval_ORGANIZATION_recall": 0.9384615384615385,
"eval_PERSON_f1": 0.8825396825396825,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8424242424242424,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8813559322033899,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8387096774193549,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.16088581085205078,
"eval_overall_accuracy": 0.9541707080504365,
"eval_overall_f1": 0.811443433029909,
"eval_overall_precision": 0.7393364928909952,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3275,
"eval_samples_per_second": 570.964,
"eval_steps_per_second": 9.16,
"step": 5724
},
{
"epoch": 55.0,
"grad_norm": 0.5186824202537537,
"learning_rate": 2.25e-05,
"loss": 0.0571,
"step": 5830
},
{
"epoch": 55.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.75,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6551724137931034,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7733333333333333,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6904761904761905,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14577339589595795,
"eval_overall_accuracy": 0.9599903006789525,
"eval_overall_f1": 0.8282290279627165,
"eval_overall_precision": 0.7698019801980198,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3267,
"eval_samples_per_second": 572.313,
"eval_steps_per_second": 9.181,
"step": 5830
},
{
"epoch": 56.0,
"grad_norm": 1.0186669826507568,
"learning_rate": 2.2000000000000003e-05,
"loss": 0.0574,
"step": 5936
},
{
"epoch": 56.0,
"eval_LOCATION_f1": 0.7848101265822784,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7516778523489933,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.90032154340836,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8695652173913043,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8333333333333334,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.78125,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14299847185611725,
"eval_overall_accuracy": 0.9609602327837051,
"eval_overall_f1": 0.8308921438082557,
"eval_overall_precision": 0.7722772277227723,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3268,
"eval_samples_per_second": 572.282,
"eval_steps_per_second": 9.181,
"step": 5936
},
{
"epoch": 57.0,
"grad_norm": 0.6867424845695496,
"learning_rate": 2.15e-05,
"loss": 0.0549,
"step": 6042
},
{
"epoch": 57.0,
"eval_LOCATION_f1": 0.779874213836478,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7045454545454546,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7808219178082192,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7037037037037037,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8917197452229298,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8536585365853658,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.14952713251113892,
"eval_overall_accuracy": 0.9616876818622696,
"eval_overall_f1": 0.8335552596537948,
"eval_overall_precision": 0.7747524752475248,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3268,
"eval_samples_per_second": 572.296,
"eval_steps_per_second": 9.181,
"step": 6042
},
{
"epoch": 58.0,
"grad_norm": 0.42461711168289185,
"learning_rate": 2.1e-05,
"loss": 0.0534,
"step": 6148
},
{
"epoch": 58.0,
"eval_LOCATION_f1": 0.7692307692307694,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7058823529411765,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7702702702702702,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6867469879518072,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7733333333333333,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6904761904761905,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14496611058712006,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.8262032085561497,
"eval_overall_precision": 0.770573566084788,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.327,
"eval_samples_per_second": 571.822,
"eval_steps_per_second": 9.174,
"step": 6148
},
{
"epoch": 59.0,
"grad_norm": 2.0102553367614746,
"learning_rate": 2.05e-05,
"loss": 0.0513,
"step": 6254
},
{
"epoch": 59.0,
"eval_LOCATION_f1": 0.7532467532467533,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6987951807228916,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7692307692307692,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6593406593406593,
"eval_ORGANIZATION_recall": 0.9230769230769231,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.912280701754386,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.896551724137931,
"eval_TIME_recall": 0.9285714285714286,
"eval_loss": 0.147059828042984,
"eval_overall_accuracy": 0.9609602327837051,
"eval_overall_f1": 0.8302387267904509,
"eval_overall_precision": 0.769041769041769,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3282,
"eval_samples_per_second": 569.709,
"eval_steps_per_second": 9.14,
"step": 6254
},
{
"epoch": 60.0,
"grad_norm": 1.5348504781723022,
"learning_rate": 2e-05,
"loss": 0.0524,
"step": 6360
},
{
"epoch": 60.0,
"eval_LOCATION_f1": 0.7631578947368421,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7160493827160493,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7712418300653594,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6704545454545454,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.888178913738019,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.852760736196319,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14413262903690338,
"eval_overall_accuracy": 0.9599903006789525,
"eval_overall_f1": 0.8273092369477911,
"eval_overall_precision": 0.7725,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.327,
"eval_samples_per_second": 571.842,
"eval_steps_per_second": 9.174,
"step": 6360
},
{
"epoch": 61.0,
"grad_norm": 1.0918995141983032,
"learning_rate": 1.9500000000000003e-05,
"loss": 0.0523,
"step": 6466
},
{
"epoch": 61.0,
"eval_LOCATION_f1": 0.7581699346405228,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7073170731707317,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7564102564102564,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6483516483516484,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.888888888888889,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8484848484848485,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15414579212665558,
"eval_overall_accuracy": 0.9585354025218235,
"eval_overall_f1": 0.8222811671087533,
"eval_overall_precision": 0.7616707616707616,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3259,
"eval_samples_per_second": 573.773,
"eval_steps_per_second": 9.205,
"step": 6466
},
{
"epoch": 62.0,
"grad_norm": 0.9440881013870239,
"learning_rate": 1.9e-05,
"loss": 0.0531,
"step": 6572
},
{
"epoch": 62.0,
"eval_LOCATION_f1": 0.7814569536423841,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7375,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7682119205298013,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6744186046511628,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15256355702877045,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.8306451612903226,
"eval_overall_precision": 0.7783375314861462,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.326,
"eval_samples_per_second": 573.658,
"eval_steps_per_second": 9.203,
"step": 6572
},
{
"epoch": 63.0,
"grad_norm": 1.0544549226760864,
"learning_rate": 1.85e-05,
"loss": 0.0495,
"step": 6678
},
{
"epoch": 63.0,
"eval_LOCATION_f1": 0.7483870967741935,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.6904761904761905,
"eval_LOCATION_recall": 0.8169014084507042,
"eval_ORGANIZATION_f1": 0.7435897435897436,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6373626373626373,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8771929824561403,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8620689655172413,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1558208018541336,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8218085106382977,
"eval_overall_precision": 0.762962962962963,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.327,
"eval_samples_per_second": 571.805,
"eval_steps_per_second": 9.173,
"step": 6678
},
{
"epoch": 64.0,
"grad_norm": 0.0981023833155632,
"learning_rate": 1.8e-05,
"loss": 0.0503,
"step": 6784
},
{
"epoch": 64.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7733333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6823529411764706,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8974358974358974,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7733333333333333,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6904761904761905,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15108107030391693,
"eval_overall_accuracy": 0.9614451988360815,
"eval_overall_f1": 0.8293333333333333,
"eval_overall_precision": 0.771712158808933,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3276,
"eval_samples_per_second": 570.896,
"eval_steps_per_second": 9.159,
"step": 6784
},
{
"epoch": 65.0,
"grad_norm": 0.6967347264289856,
"learning_rate": 1.75e-05,
"loss": 0.0517,
"step": 6890
},
{
"epoch": 65.0,
"eval_LOCATION_f1": 0.7843137254901961,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7702702702702702,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6867469879518072,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.8910256410256411,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8580246913580247,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14456935226917267,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8317631224764469,
"eval_overall_precision": 0.7803030303030303,
"eval_overall_recall": 0.8904899135446686,
"eval_runtime": 0.3275,
"eval_samples_per_second": 570.976,
"eval_steps_per_second": 9.16,
"step": 6890
},
{
"epoch": 66.0,
"grad_norm": 0.616130530834198,
"learning_rate": 1.7000000000000003e-05,
"loss": 0.0493,
"step": 6996
},
{
"epoch": 66.0,
"eval_LOCATION_f1": 0.7875000000000001,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7078651685393258,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7532467532467532,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.651685393258427,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7272727272727273,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6363636363636364,
"eval_QUANTITY_recall": 0.8484848484848485,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16076360642910004,
"eval_overall_accuracy": 0.9570805043646945,
"eval_overall_f1": 0.8236842105263158,
"eval_overall_precision": 0.7578692493946732,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3273,
"eval_samples_per_second": 571.374,
"eval_steps_per_second": 9.166,
"step": 6996
},
{
"epoch": 67.0,
"grad_norm": 0.8930002450942993,
"learning_rate": 1.65e-05,
"loss": 0.0508,
"step": 7102
},
{
"epoch": 67.0,
"eval_LOCATION_f1": 0.7848101265822784,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7581699346405228,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6590909090909091,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.888178913738019,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.852760736196319,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7631578947368421,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6744186046511628,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1603231132030487,
"eval_overall_accuracy": 0.957807953443259,
"eval_overall_f1": 0.8232189973614775,
"eval_overall_precision": 0.7591240875912408,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3264,
"eval_samples_per_second": 572.961,
"eval_steps_per_second": 9.192,
"step": 7102
},
{
"epoch": 68.0,
"grad_norm": 0.3851192891597748,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.0486,
"step": 7208
},
{
"epoch": 68.0,
"eval_LOCATION_f1": 0.7612903225806451,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7023809523809523,
"eval_LOCATION_recall": 0.8309859154929577,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7733333333333333,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6904761904761905,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14870406687259674,
"eval_overall_accuracy": 0.9595053346265762,
"eval_overall_f1": 0.8213333333333332,
"eval_overall_precision": 0.7642679900744417,
"eval_overall_recall": 0.8876080691642652,
"eval_runtime": 0.3249,
"eval_samples_per_second": 575.524,
"eval_steps_per_second": 9.233,
"step": 7208
},
{
"epoch": 69.0,
"grad_norm": 0.668571949005127,
"learning_rate": 1.55e-05,
"loss": 0.0475,
"step": 7314
},
{
"epoch": 69.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8945686900958466,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8588957055214724,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15184400975704193,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8353413654618473,
"eval_overall_precision": 0.78,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3285,
"eval_samples_per_second": 569.263,
"eval_steps_per_second": 9.133,
"step": 7314
},
{
"epoch": 70.0,
"grad_norm": 1.2341712713241577,
"learning_rate": 1.5e-05,
"loss": 0.0491,
"step": 7420
},
{
"epoch": 70.0,
"eval_LOCATION_f1": 0.8133333333333335,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7721518987341772,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7837837837837838,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6987951807228916,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.14618448913097382,
"eval_overall_accuracy": 0.9629000969932104,
"eval_overall_f1": 0.8389715832205683,
"eval_overall_precision": 0.7908163265306123,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3272,
"eval_samples_per_second": 571.603,
"eval_steps_per_second": 9.17,
"step": 7420
},
{
"epoch": 71.0,
"grad_norm": 0.7431372404098511,
"learning_rate": 1.45e-05,
"loss": 0.0462,
"step": 7526
},
{
"epoch": 71.0,
"eval_LOCATION_f1": 0.7848101265822784,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7126436781609196,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.888178913738019,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.852760736196319,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7733333333333333,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.6904761904761905,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1648775339126587,
"eval_overall_accuracy": 0.9582929194956353,
"eval_overall_f1": 0.8269484808454426,
"eval_overall_precision": 0.7634146341463415,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3274,
"eval_samples_per_second": 571.19,
"eval_steps_per_second": 9.163,
"step": 7526
},
{
"epoch": 72.0,
"grad_norm": 0.7144307494163513,
"learning_rate": 1.4000000000000001e-05,
"loss": 0.046,
"step": 7632
},
{
"epoch": 72.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7712418300653594,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6704545454545454,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.8903225806451613,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8625,
"eval_PERSON_recall": 0.92,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.7999999999999999,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.75,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1596042811870575,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8308921438082557,
"eval_overall_precision": 0.7722772277227723,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3254,
"eval_samples_per_second": 574.71,
"eval_steps_per_second": 9.22,
"step": 7632
},
{
"epoch": 73.0,
"grad_norm": 0.5636935830116272,
"learning_rate": 1.3500000000000001e-05,
"loss": 0.0453,
"step": 7738
},
{
"epoch": 73.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7516778523489933,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8938906752411575,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8633540372670807,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7837837837837839,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7073170731707317,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8474576271186439,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8064516129032258,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.1584891676902771,
"eval_overall_accuracy": 0.9592628516003879,
"eval_overall_f1": 0.8315508021390374,
"eval_overall_precision": 0.7755610972568578,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3271,
"eval_samples_per_second": 571.735,
"eval_steps_per_second": 9.172,
"step": 7738
},
{
"epoch": 74.0,
"grad_norm": 0.8465162515640259,
"learning_rate": 1.3000000000000001e-05,
"loss": 0.0467,
"step": 7844
},
{
"epoch": 74.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7516778523489933,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.8996763754045306,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8742138364779874,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1548159122467041,
"eval_overall_accuracy": 0.9604752667313288,
"eval_overall_f1": 0.8322147651006712,
"eval_overall_precision": 0.7788944723618091,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3278,
"eval_samples_per_second": 570.444,
"eval_steps_per_second": 9.152,
"step": 7844
},
{
"epoch": 75.0,
"grad_norm": 1.0343018770217896,
"learning_rate": 1.25e-05,
"loss": 0.0443,
"step": 7950
},
{
"epoch": 75.0,
"eval_LOCATION_f1": 0.823529411764706,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7682926829268293,
"eval_LOCATION_recall": 0.8873239436619719,
"eval_ORGANIZATION_f1": 0.7368421052631579,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6436781609195402,
"eval_ORGANIZATION_recall": 0.8615384615384616,
"eval_PERSON_f1": 0.9025974025974027,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.879746835443038,
"eval_PERSON_recall": 0.9266666666666666,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8135593220338982,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.7741935483870968,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15346647799015045,
"eval_overall_accuracy": 0.9616876818622696,
"eval_overall_f1": 0.8348993288590604,
"eval_overall_precision": 0.7814070351758794,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3271,
"eval_samples_per_second": 571.622,
"eval_steps_per_second": 9.17,
"step": 7950
},
{
"epoch": 76.0,
"grad_norm": 0.05382401496171951,
"learning_rate": 1.2e-05,
"loss": 0.0447,
"step": 8056
},
{
"epoch": 76.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7814569536423841,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.686046511627907,
"eval_ORGANIZATION_recall": 0.9076923076923077,
"eval_PERSON_f1": 0.9061488673139159,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8620689655172413,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8333333333333334,
"eval_TIME_recall": 0.8928571428571429,
"eval_loss": 0.16000644862651825,
"eval_overall_accuracy": 0.9619301648884578,
"eval_overall_f1": 0.8467741935483871,
"eval_overall_precision": 0.7934508816120907,
"eval_overall_recall": 0.9077809798270894,
"eval_runtime": 0.326,
"eval_samples_per_second": 573.613,
"eval_steps_per_second": 9.202,
"step": 8056
},
{
"epoch": 77.0,
"grad_norm": 9.811291694641113,
"learning_rate": 1.1500000000000002e-05,
"loss": 0.0441,
"step": 8162
},
{
"epoch": 77.0,
"eval_LOCATION_f1": 0.7721518987341772,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7011494252873564,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7808219178082192,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.7037037037037037,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.8055555555555556,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.7435897435897436,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15801285207271576,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8371467025572005,
"eval_overall_precision": 0.7853535353535354,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.328,
"eval_samples_per_second": 570.116,
"eval_steps_per_second": 9.146,
"step": 8162
},
{
"epoch": 78.0,
"grad_norm": 1.3943322896957397,
"learning_rate": 1.1000000000000001e-05,
"loss": 0.0438,
"step": 8268
},
{
"epoch": 78.0,
"eval_LOCATION_f1": 0.782051282051282,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7176470588235294,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7785234899328859,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6904761904761905,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15934574604034424,
"eval_overall_accuracy": 0.9609602327837051,
"eval_overall_f1": 0.8387096774193548,
"eval_overall_precision": 0.7858942065491183,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3262,
"eval_samples_per_second": 573.317,
"eval_steps_per_second": 9.198,
"step": 8268
},
{
"epoch": 79.0,
"grad_norm": 0.6321301460266113,
"learning_rate": 1.05e-05,
"loss": 0.0449,
"step": 8374
},
{
"epoch": 79.0,
"eval_LOCATION_f1": 0.7843137254901961,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7317073170731707,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7651006711409396,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6785714285714286,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15974144637584686,
"eval_overall_accuracy": 0.960717749757517,
"eval_overall_f1": 0.8367071524966262,
"eval_overall_precision": 0.7868020304568528,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3286,
"eval_samples_per_second": 569.091,
"eval_steps_per_second": 9.13,
"step": 8374
},
{
"epoch": 80.0,
"grad_norm": 0.5539495348930359,
"learning_rate": 1e-05,
"loss": 0.0436,
"step": 8480
},
{
"epoch": 80.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7785234899328859,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6904761904761905,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9061488673139159,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16229036450386047,
"eval_overall_accuracy": 0.9609602327837051,
"eval_overall_f1": 0.8421052631578949,
"eval_overall_precision": 0.7918781725888325,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3259,
"eval_samples_per_second": 573.851,
"eval_steps_per_second": 9.206,
"step": 8480
},
{
"epoch": 81.0,
"grad_norm": 3.007709503173828,
"learning_rate": 9.5e-06,
"loss": 0.0434,
"step": 8586
},
{
"epoch": 81.0,
"eval_LOCATION_f1": 0.8,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7380952380952381,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7581699346405228,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6590909090909091,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8275862068965518,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1612003743648529,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.835781041388518,
"eval_overall_precision": 0.7786069651741293,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3275,
"eval_samples_per_second": 571.067,
"eval_steps_per_second": 9.162,
"step": 8586
},
{
"epoch": 82.0,
"grad_norm": 1.6446222066879272,
"learning_rate": 9e-06,
"loss": 0.0428,
"step": 8692
},
{
"epoch": 82.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7586206896551724,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6875,
"eval_ORGANIZATION_recall": 0.8461538461538461,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15457752346992493,
"eval_overall_accuracy": 0.9616876818622696,
"eval_overall_f1": 0.8401084010840109,
"eval_overall_precision": 0.7928388746803069,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3262,
"eval_samples_per_second": 573.188,
"eval_steps_per_second": 9.196,
"step": 8692
},
{
"epoch": 83.0,
"grad_norm": 0.6172337532043457,
"learning_rate": 8.500000000000002e-06,
"loss": 0.043,
"step": 8798
},
{
"epoch": 83.0,
"eval_LOCATION_f1": 0.7792207792207793,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7228915662650602,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.76,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6705882352941176,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16485904157161713,
"eval_overall_accuracy": 0.9590203685741998,
"eval_overall_f1": 0.8344549125168236,
"eval_overall_precision": 0.7828282828282829,
"eval_overall_recall": 0.8933717579250721,
"eval_runtime": 0.3271,
"eval_samples_per_second": 571.666,
"eval_steps_per_second": 9.171,
"step": 8798
},
{
"epoch": 84.0,
"grad_norm": 0.48714974522590637,
"learning_rate": 8.000000000000001e-06,
"loss": 0.0451,
"step": 8904
},
{
"epoch": 84.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7755102040816327,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6951219512195121,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15948227047920227,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8421052631578949,
"eval_overall_precision": 0.7918781725888325,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3279,
"eval_samples_per_second": 570.348,
"eval_steps_per_second": 9.15,
"step": 8904
},
{
"epoch": 85.0,
"grad_norm": 0.8867198824882507,
"learning_rate": 7.5e-06,
"loss": 0.0444,
"step": 9010
},
{
"epoch": 85.0,
"eval_LOCATION_f1": 0.8051948051948051,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7469879518072289,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7682119205298013,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6744186046511628,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9061488673139159,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16462980210781097,
"eval_overall_accuracy": 0.960717749757517,
"eval_overall_f1": 0.8413978494623656,
"eval_overall_precision": 0.7884130982367759,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3281,
"eval_samples_per_second": 569.983,
"eval_steps_per_second": 9.144,
"step": 9010
},
{
"epoch": 86.0,
"grad_norm": 0.4750601649284363,
"learning_rate": 7.000000000000001e-06,
"loss": 0.0406,
"step": 9116
},
{
"epoch": 86.0,
"eval_LOCATION_f1": 0.8026315789473684,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7530864197530864,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7702702702702702,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6867469879518072,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9096774193548387,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.88125,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15999138355255127,
"eval_overall_accuracy": 0.9619301648884578,
"eval_overall_f1": 0.8432432432432433,
"eval_overall_precision": 0.7938931297709924,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3277,
"eval_samples_per_second": 570.57,
"eval_steps_per_second": 9.154,
"step": 9116
},
{
"epoch": 87.0,
"grad_norm": 0.6775397658348083,
"learning_rate": 6.5000000000000004e-06,
"loss": 0.0415,
"step": 9222
},
{
"epoch": 87.0,
"eval_LOCATION_f1": 0.8104575163398693,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7560975609756098,
"eval_LOCATION_recall": 0.8732394366197183,
"eval_ORGANIZATION_f1": 0.7785234899328859,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6904761904761905,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8974358974358974,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16279393434524536,
"eval_overall_accuracy": 0.9609602327837051,
"eval_overall_f1": 0.8413978494623656,
"eval_overall_precision": 0.7884130982367759,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3261,
"eval_samples_per_second": 573.372,
"eval_steps_per_second": 9.198,
"step": 9222
},
{
"epoch": 88.0,
"grad_norm": 0.4834389090538025,
"learning_rate": 6e-06,
"loss": 0.0407,
"step": 9328
},
{
"epoch": 88.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7682119205298013,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6744186046511628,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9061488673139159,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8805031446540881,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8571428571428571,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8571428571428571,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1641407161951065,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8409703504043127,
"eval_overall_precision": 0.789873417721519,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3268,
"eval_samples_per_second": 572.15,
"eval_steps_per_second": 9.179,
"step": 9328
},
{
"epoch": 89.0,
"grad_norm": 3.0661368370056152,
"learning_rate": 5.500000000000001e-06,
"loss": 0.0426,
"step": 9434
},
{
"epoch": 89.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7733333333333334,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6823529411764706,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9067524115755627,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8757763975155279,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1607460379600525,
"eval_overall_accuracy": 0.962172647914646,
"eval_overall_f1": 0.8413978494623656,
"eval_overall_precision": 0.7884130982367759,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3275,
"eval_samples_per_second": 571.022,
"eval_steps_per_second": 9.161,
"step": 9434
},
{
"epoch": 90.0,
"grad_norm": 0.5167478919029236,
"learning_rate": 5e-06,
"loss": 0.041,
"step": 9540
},
{
"epoch": 90.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7837837837837838,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6987951807228916,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16166909039020538,
"eval_overall_accuracy": 0.9609602327837051,
"eval_overall_f1": 0.8421052631578949,
"eval_overall_precision": 0.7918781725888325,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3276,
"eval_samples_per_second": 570.818,
"eval_steps_per_second": 9.158,
"step": 9540
},
{
"epoch": 91.0,
"grad_norm": 0.6979191303253174,
"learning_rate": 4.5e-06,
"loss": 0.0406,
"step": 9646
},
{
"epoch": 91.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16465260088443756,
"eval_overall_accuracy": 0.960717749757517,
"eval_overall_f1": 0.8375838926174496,
"eval_overall_precision": 0.7839195979899497,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3268,
"eval_samples_per_second": 572.184,
"eval_steps_per_second": 9.179,
"step": 9646
},
{
"epoch": 92.0,
"grad_norm": 0.35358938574790955,
"learning_rate": 4.000000000000001e-06,
"loss": 0.0408,
"step": 9752
},
{
"epoch": 92.0,
"eval_LOCATION_f1": 0.7894736842105262,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7407407407407407,
"eval_LOCATION_recall": 0.8450704225352113,
"eval_ORGANIZATION_f1": 0.7702702702702702,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6867469879518072,
"eval_ORGANIZATION_recall": 0.8769230769230769,
"eval_PERSON_f1": 0.9067524115755627,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8757763975155279,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.15703369677066803,
"eval_overall_accuracy": 0.962172647914646,
"eval_overall_f1": 0.8394062078272604,
"eval_overall_precision": 0.7893401015228426,
"eval_overall_recall": 0.8962536023054755,
"eval_runtime": 0.3273,
"eval_samples_per_second": 571.285,
"eval_steps_per_second": 9.165,
"step": 9752
},
{
"epoch": 93.0,
"grad_norm": 0.4786812365055084,
"learning_rate": 3.5000000000000004e-06,
"loss": 0.0411,
"step": 9858
},
{
"epoch": 93.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9067524115755627,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8757763975155279,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1660545915365219,
"eval_overall_accuracy": 0.960717749757517,
"eval_overall_f1": 0.8380187416331996,
"eval_overall_precision": 0.7825,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.328,
"eval_samples_per_second": 570.159,
"eval_steps_per_second": 9.147,
"step": 9858
},
{
"epoch": 94.0,
"grad_norm": 0.8427369594573975,
"learning_rate": 3e-06,
"loss": 0.04,
"step": 9964
},
{
"epoch": 94.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16458158195018768,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8375838926174496,
"eval_overall_precision": 0.7839195979899497,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.327,
"eval_samples_per_second": 571.854,
"eval_steps_per_second": 9.174,
"step": 9964
},
{
"epoch": 95.0,
"grad_norm": 1.0689115524291992,
"learning_rate": 2.5e-06,
"loss": 0.0372,
"step": 10070
},
{
"epoch": 95.0,
"eval_LOCATION_f1": 0.7922077922077921,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7349397590361446,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9067524115755627,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8757763975155279,
"eval_PERSON_recall": 0.94,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16513913869857788,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8380187416331996,
"eval_overall_precision": 0.7825,
"eval_overall_recall": 0.9020172910662824,
"eval_runtime": 0.3273,
"eval_samples_per_second": 571.379,
"eval_steps_per_second": 9.167,
"step": 10070
},
{
"epoch": 96.0,
"grad_norm": 0.6339386105537415,
"learning_rate": 2.0000000000000003e-06,
"loss": 0.0393,
"step": 10176
},
{
"epoch": 96.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.8974358974358974,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.8641975308641975,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1637803018093109,
"eval_overall_accuracy": 0.9614451988360815,
"eval_overall_f1": 0.8353413654618473,
"eval_overall_precision": 0.78,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3261,
"eval_samples_per_second": 573.445,
"eval_steps_per_second": 9.2,
"step": 10176
},
{
"epoch": 97.0,
"grad_norm": 0.6922338604927063,
"learning_rate": 1.5e-06,
"loss": 0.0396,
"step": 10282
},
{
"epoch": 97.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16408979892730713,
"eval_overall_accuracy": 0.9609602327837051,
"eval_overall_f1": 0.8375838926174496,
"eval_overall_precision": 0.7839195979899497,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3277,
"eval_samples_per_second": 570.597,
"eval_steps_per_second": 9.154,
"step": 10282
},
{
"epoch": 98.0,
"grad_norm": 1.161203384399414,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0385,
"step": 10388
},
{
"epoch": 98.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1643643081188202,
"eval_overall_accuracy": 0.9609602327837051,
"eval_overall_f1": 0.8375838926174496,
"eval_overall_precision": 0.7839195979899497,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3284,
"eval_samples_per_second": 569.344,
"eval_steps_per_second": 9.134,
"step": 10388
},
{
"epoch": 99.0,
"grad_norm": 0.5302362442016602,
"learning_rate": 5.000000000000001e-07,
"loss": 0.0382,
"step": 10494
},
{
"epoch": 99.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.1647883802652359,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8375838926174496,
"eval_overall_precision": 0.7839195979899497,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3268,
"eval_samples_per_second": 572.201,
"eval_steps_per_second": 9.18,
"step": 10494
},
{
"epoch": 100.0,
"grad_norm": 0.16222168505191803,
"learning_rate": 0.0,
"loss": 0.0411,
"step": 10600
},
{
"epoch": 100.0,
"eval_LOCATION_f1": 0.7973856209150327,
"eval_LOCATION_number": 71,
"eval_LOCATION_precision": 0.7439024390243902,
"eval_LOCATION_recall": 0.8591549295774648,
"eval_ORGANIZATION_f1": 0.7631578947368421,
"eval_ORGANIZATION_number": 65,
"eval_ORGANIZATION_precision": 0.6666666666666666,
"eval_ORGANIZATION_recall": 0.8923076923076924,
"eval_PERSON_f1": 0.9032258064516129,
"eval_PERSON_number": 150,
"eval_PERSON_precision": 0.875,
"eval_PERSON_recall": 0.9333333333333333,
"eval_QUANTITY_f1": 0.7945205479452054,
"eval_QUANTITY_number": 33,
"eval_QUANTITY_precision": 0.725,
"eval_QUANTITY_recall": 0.8787878787878788,
"eval_TIME_f1": 0.8421052631578947,
"eval_TIME_number": 28,
"eval_TIME_precision": 0.8275862068965517,
"eval_TIME_recall": 0.8571428571428571,
"eval_loss": 0.16485615074634552,
"eval_overall_accuracy": 0.9612027158098934,
"eval_overall_f1": 0.8375838926174496,
"eval_overall_precision": 0.7839195979899497,
"eval_overall_recall": 0.899135446685879,
"eval_runtime": 0.3263,
"eval_samples_per_second": 573.127,
"eval_steps_per_second": 9.195,
"step": 10600
},
{
"epoch": 100.0,
"step": 10600,
"total_flos": 5123217774191952.0,
"train_loss": 0.08768324019773951,
"train_runtime": 561.3026,
"train_samples_per_second": 300.729,
"train_steps_per_second": 18.885
}
],
"logging_steps": 500,
"max_steps": 10600,
"num_input_tokens_seen": 0,
"num_train_epochs": 100,
"save_steps": 500,
"total_flos": 5123217774191952.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}