{ "best_metric": null, "best_model_checkpoint": null, "epoch": 100.0, "eval_steps": 500, "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 2.6862921714782715, "learning_rate": 4.9500000000000004e-05, "loss": 0.9792, "step": 106 }, { "epoch": 1.0, "eval_LOCATION_f1": 0.0, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.0, "eval_LOCATION_recall": 0.0, "eval_ORGANIZATION_f1": 0.0, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.0, "eval_ORGANIZATION_recall": 0.0, "eval_PERSON_f1": 0.18095238095238095, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.31666666666666665, "eval_PERSON_recall": 0.12666666666666668, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.06666666666666667, "eval_TIME_number": 28, "eval_TIME_precision": 0.5, "eval_TIME_recall": 0.03571428571428571, "eval_loss": 0.5512092113494873, "eval_overall_accuracy": 0.850387972841901, "eval_overall_f1": 0.09501187648456057, "eval_overall_precision": 0.2702702702702703, "eval_overall_recall": 0.05763688760806916, "eval_runtime": 0.3324, "eval_samples_per_second": 562.651, "eval_steps_per_second": 9.026, "step": 106 }, { "epoch": 2.0, "grad_norm": 1.0679957866668701, "learning_rate": 4.9e-05, "loss": 0.4837, "step": 212 }, { "epoch": 2.0, "eval_LOCATION_f1": 0.41739130434782606, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.5454545454545454, "eval_LOCATION_recall": 0.3380281690140845, "eval_ORGANIZATION_f1": 0.019801980198019802, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.027777777777777776, "eval_ORGANIZATION_recall": 0.015384615384615385, "eval_PERSON_f1": 0.6831955922865013, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.5821596244131455, "eval_PERSON_recall": 0.8266666666666667, "eval_QUANTITY_f1": 0.0, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.0, "eval_QUANTITY_recall": 0.0, "eval_TIME_f1": 0.5454545454545454, "eval_TIME_number": 28, "eval_TIME_precision": 0.47368421052631576, "eval_TIME_recall": 0.6428571428571429, "eval_loss": 0.33068543672561646, "eval_overall_accuracy": 0.9022793404461688, "eval_overall_f1": 0.4798850574712644, "eval_overall_precision": 0.4785100286532951, "eval_overall_recall": 0.4812680115273775, "eval_runtime": 0.3251, "eval_samples_per_second": 575.209, "eval_steps_per_second": 9.228, "step": 212 }, { "epoch": 3.0, "grad_norm": 0.8312263488769531, "learning_rate": 4.85e-05, "loss": 0.3133, "step": 318 }, { "epoch": 3.0, "eval_LOCATION_f1": 0.5306122448979592, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.5131578947368421, "eval_LOCATION_recall": 0.5492957746478874, "eval_ORGANIZATION_f1": 0.4000000000000001, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.34444444444444444, "eval_ORGANIZATION_recall": 0.47692307692307695, "eval_PERSON_f1": 0.7710843373493976, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7032967032967034, "eval_PERSON_recall": 0.8533333333333334, "eval_QUANTITY_f1": 0.5194805194805195, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.45454545454545453, "eval_QUANTITY_recall": 0.6060606060606061, "eval_TIME_f1": 0.793103448275862, "eval_TIME_number": 28, "eval_TIME_precision": 0.7666666666666667, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.21400973200798035, "eval_overall_accuracy": 0.9308923375363725, "eval_overall_f1": 0.6267880364109232, "eval_overall_precision": 0.5710900473933649, "eval_overall_recall": 0.6945244956772334, "eval_runtime": 0.3261, "eval_samples_per_second": 573.482, "eval_steps_per_second": 9.2, "step": 318 }, { "epoch": 4.0, "grad_norm": 1.0169802904129028, "learning_rate": 4.8e-05, "loss": 0.2327, "step": 424 }, { "epoch": 4.0, "eval_LOCATION_f1": 0.6436781609195402, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.5436893203883495, "eval_LOCATION_recall": 0.7887323943661971, "eval_ORGANIZATION_f1": 0.5590062111801243, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.46875, "eval_ORGANIZATION_recall": 0.6923076923076923, "eval_PERSON_f1": 0.8421052631578947, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.7861271676300579, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.5897435897435898, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5111111111111111, "eval_QUANTITY_recall": 0.696969696969697, "eval_TIME_f1": 0.7719298245614034, "eval_TIME_number": 28, "eval_TIME_precision": 0.7586206896551724, "eval_TIME_recall": 0.7857142857142857, "eval_loss": 0.17442111670970917, "eval_overall_accuracy": 0.9408341416100873, "eval_overall_f1": 0.7112232030264818, "eval_overall_precision": 0.6322869955156951, "eval_overall_recall": 0.8126801152737753, "eval_runtime": 0.3287, "eval_samples_per_second": 568.904, "eval_steps_per_second": 9.127, "step": 424 }, { "epoch": 5.0, "grad_norm": 1.3268284797668457, "learning_rate": 4.75e-05, "loss": 0.1989, "step": 530 }, { "epoch": 5.0, "eval_LOCATION_f1": 0.7215189873417721, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6551724137931034, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.6493506493506495, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5617977528089888, "eval_ORGANIZATION_recall": 0.7692307692307693, "eval_PERSON_f1": 0.8652037617554857, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8165680473372781, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6329113924050633, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5434782608695652, "eval_QUANTITY_recall": 0.7575757575757576, "eval_TIME_f1": 0.7796610169491526, "eval_TIME_number": 28, "eval_TIME_precision": 0.7419354838709677, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.1507454365491867, "eval_overall_accuracy": 0.9481086323957323, "eval_overall_f1": 0.7620286085825748, "eval_overall_precision": 0.6943127962085308, "eval_overall_recall": 0.8443804034582133, "eval_runtime": 0.3267, "eval_samples_per_second": 572.456, "eval_steps_per_second": 9.184, "step": 530 }, { "epoch": 6.0, "grad_norm": 1.4492706060409546, "learning_rate": 4.7e-05, "loss": 0.1782, "step": 636 }, { "epoch": 6.0, "eval_LOCATION_f1": 0.7088607594936709, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6436781609195402, "eval_LOCATION_recall": 0.7887323943661971, "eval_ORGANIZATION_f1": 0.6473988439306357, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5185185185185185, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8598130841121495, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8070175438596491, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.6352941176470589, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5192307692307693, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.746268656716418, "eval_TIME_number": 28, "eval_TIME_precision": 0.6410256410256411, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.17294442653656006, "eval_overall_accuracy": 0.9425315227934045, "eval_overall_f1": 0.7512437810945274, "eval_overall_precision": 0.6608315098468271, "eval_overall_recall": 0.8703170028818443, "eval_runtime": 0.327, "eval_samples_per_second": 571.852, "eval_steps_per_second": 9.174, "step": 636 }, { "epoch": 7.0, "grad_norm": 2.372952938079834, "learning_rate": 4.6500000000000005e-05, "loss": 0.1675, "step": 742 }, { "epoch": 7.0, "eval_LOCATION_f1": 0.7407407407407407, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6593406593406593, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.675, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5684210526315789, "eval_ORGANIZATION_recall": 0.8307692307692308, "eval_PERSON_f1": 0.8706624605678233, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8263473053892215, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7179487179487178, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6222222222222222, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.75, "eval_TIME_number": 28, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1436489075422287, "eval_overall_accuracy": 0.950533462657614, "eval_overall_f1": 0.7784891165172856, "eval_overall_precision": 0.7004608294930875, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3264, "eval_samples_per_second": 572.836, "eval_steps_per_second": 9.19, "step": 742 }, { "epoch": 8.0, "grad_norm": 0.5531976222991943, "learning_rate": 4.600000000000001e-05, "loss": 0.1523, "step": 848 }, { "epoch": 8.0, "eval_LOCATION_f1": 0.7643312101910827, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6976744186046512, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.6832298136645962, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5729166666666666, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8670886075949367, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8253012048192772, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.736842105263158, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6511627906976745, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7936507936507937, "eval_TIME_number": 28, "eval_TIME_precision": 0.7142857142857143, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1423933058977127, "eval_overall_accuracy": 0.9527158098933075, "eval_overall_f1": 0.7891332470892625, "eval_overall_precision": 0.715962441314554, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3281, "eval_samples_per_second": 570.034, "eval_steps_per_second": 9.145, "step": 848 }, { "epoch": 9.0, "grad_norm": 1.0425461530685425, "learning_rate": 4.55e-05, "loss": 0.148, "step": 954 }, { "epoch": 9.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7466666666666668, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6588235294117647, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8690095846645367, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8343558282208589, "eval_PERSON_recall": 0.9066666666666666, "eval_QUANTITY_f1": 0.6666666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5777777777777777, "eval_QUANTITY_recall": 0.7878787878787878, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 28, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13000667095184326, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.8015873015873015, "eval_overall_precision": 0.7408312958435208, "eval_overall_recall": 0.8731988472622478, "eval_runtime": 0.3275, "eval_samples_per_second": 571.032, "eval_steps_per_second": 9.161, "step": 954 }, { "epoch": 10.0, "grad_norm": 0.9898656606674194, "learning_rate": 4.5e-05, "loss": 0.1376, "step": 1060 }, { "epoch": 10.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7320261437908497, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6363636363636364, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.888178913738019, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.852760736196319, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7088607594936709, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6086956521739131, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12935131788253784, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8131578947368422, "eval_overall_precision": 0.7481840193704601, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3271, "eval_samples_per_second": 571.762, "eval_steps_per_second": 9.173, "step": 1060 }, { "epoch": 11.0, "grad_norm": 1.2879328727722168, "learning_rate": 4.4500000000000004e-05, "loss": 0.1378, "step": 1166 }, { "epoch": 11.0, "eval_LOCATION_f1": 0.7532467532467533, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6987951807228916, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.728476821192053, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6395348837209303, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.888178913738019, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.852760736196319, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 28, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12860190868377686, "eval_overall_accuracy": 0.9565955383123181, "eval_overall_f1": 0.8063660477453581, "eval_overall_precision": 0.7469287469287469, "eval_overall_recall": 0.8760806916426513, "eval_runtime": 0.3281, "eval_samples_per_second": 570.029, "eval_steps_per_second": 9.145, "step": 1166 }, { "epoch": 12.0, "grad_norm": 1.0456236600875854, "learning_rate": 4.4000000000000006e-05, "loss": 0.1279, "step": 1272 }, { "epoch": 12.0, "eval_LOCATION_f1": 0.728395061728395, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6483516483516484, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7375, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6210526315789474, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8974358974358974, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.736842105263158, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6511627906976745, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.6865671641791046, "eval_TIME_number": 28, "eval_TIME_precision": 0.5897435897435898, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.14702975749969482, "eval_overall_accuracy": 0.9524733268671193, "eval_overall_f1": 0.7953667953667953, "eval_overall_precision": 0.7186046511627907, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.329, "eval_samples_per_second": 568.322, "eval_steps_per_second": 9.117, "step": 1272 }, { "epoch": 13.0, "grad_norm": 0.7470729351043701, "learning_rate": 4.35e-05, "loss": 0.1257, "step": 1378 }, { "epoch": 13.0, "eval_LOCATION_f1": 0.7763157894736843, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8917197452229298, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8536585365853658, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8070175438596492, "eval_TIME_number": 28, "eval_TIME_precision": 0.7931034482758621, "eval_TIME_recall": 0.8214285714285714, "eval_loss": 0.12572742998600006, "eval_overall_accuracy": 0.9597478176527643, "eval_overall_f1": 0.823529411764706, "eval_overall_precision": 0.7680798004987531, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.326, "eval_samples_per_second": 573.579, "eval_steps_per_second": 9.202, "step": 1378 }, { "epoch": 14.0, "grad_norm": 1.587265133857727, "learning_rate": 4.3e-05, "loss": 0.1211, "step": 1484 }, { "epoch": 14.0, "eval_LOCATION_f1": 0.7643312101910827, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6976744186046512, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7712418300653594, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6704545454545454, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8753993610223643, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8404907975460123, "eval_PERSON_recall": 0.9133333333333333, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.6956521739130435, "eval_TIME_number": 28, "eval_TIME_precision": 0.5853658536585366, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12821051478385925, "eval_overall_accuracy": 0.9565955383123181, "eval_overall_f1": 0.8031290743155148, "eval_overall_precision": 0.7333333333333333, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3277, "eval_samples_per_second": 570.653, "eval_steps_per_second": 9.155, "step": 1484 }, { "epoch": 15.0, "grad_norm": 1.1898987293243408, "learning_rate": 4.25e-05, "loss": 0.1182, "step": 1590 }, { "epoch": 15.0, "eval_LOCATION_f1": 0.794701986754967, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7532467532467532, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.651685393258427, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8945686900958466, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 28, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12380851060152054, "eval_overall_accuracy": 0.960717749757517, "eval_overall_f1": 0.8255659121171772, "eval_overall_precision": 0.7673267326732673, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3297, "eval_samples_per_second": 567.219, "eval_steps_per_second": 9.1, "step": 1590 }, { "epoch": 16.0, "grad_norm": 1.2394359111785889, "learning_rate": 4.2e-05, "loss": 0.1084, "step": 1696 }, { "epoch": 16.0, "eval_LOCATION_f1": 0.7733333333333333, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7341772151898734, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7712418300653594, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6704545454545454, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.888178913738019, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.852760736196319, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7741935483870968, "eval_TIME_number": 28, "eval_TIME_precision": 0.7058823529411765, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12522907555103302, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.8180610889774237, "eval_overall_precision": 0.7586206896551724, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3284, "eval_samples_per_second": 569.484, "eval_steps_per_second": 9.136, "step": 1696 }, { "epoch": 17.0, "grad_norm": 0.5448505878448486, "learning_rate": 4.15e-05, "loss": 0.11, "step": 1802 }, { "epoch": 17.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7428571428571429, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6933333333333334, "eval_ORGANIZATION_recall": 0.8, "eval_PERSON_f1": 0.8917197452229298, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8536585365853658, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 28, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.11857786774635315, "eval_overall_accuracy": 0.962172647914646, "eval_overall_f1": 0.8243243243243243, "eval_overall_precision": 0.7760814249363868, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3269, "eval_samples_per_second": 572.103, "eval_steps_per_second": 9.178, "step": 1802 }, { "epoch": 18.0, "grad_norm": 0.928116500377655, "learning_rate": 4.1e-05, "loss": 0.105, "step": 1908 }, { "epoch": 18.0, "eval_LOCATION_f1": 0.7843137254901961, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7402597402597403, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6404494382022472, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.90032154340836, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.736842105263158, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6511627906976745, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.75, "eval_TIME_number": 28, "eval_TIME_precision": 0.6666666666666666, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13439632952213287, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8153034300791556, "eval_overall_precision": 0.7518248175182481, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3276, "eval_samples_per_second": 570.855, "eval_steps_per_second": 9.158, "step": 1908 }, { "epoch": 19.0, "grad_norm": 0.6120880246162415, "learning_rate": 4.05e-05, "loss": 0.1012, "step": 2014 }, { "epoch": 19.0, "eval_LOCATION_f1": 0.778523489932886, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7435897435897436, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.76, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6705882352941176, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.8000000000000002, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7567567567567568, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1134907528758049, "eval_overall_accuracy": 0.9643549951503395, "eval_overall_f1": 0.8299319727891157, "eval_overall_precision": 0.7860824742268041, "eval_overall_recall": 0.8789625360230547, "eval_runtime": 0.3267, "eval_samples_per_second": 572.422, "eval_steps_per_second": 9.183, "step": 2014 }, { "epoch": 20.0, "grad_norm": 0.7189091444015503, "learning_rate": 4e-05, "loss": 0.1009, "step": 2120 }, { "epoch": 20.0, "eval_LOCATION_f1": 0.8129032258064516, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.75, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.763888888888889, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6962025316455697, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.887459807073955, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8571428571428571, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.11710327118635178, "eval_overall_accuracy": 0.9636275460717749, "eval_overall_f1": 0.8324324324324324, "eval_overall_precision": 0.7837150127226463, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3264, "eval_samples_per_second": 572.982, "eval_steps_per_second": 9.192, "step": 2120 }, { "epoch": 21.0, "grad_norm": 1.2998398542404175, "learning_rate": 3.9500000000000005e-05, "loss": 0.0994, "step": 2226 }, { "epoch": 21.0, "eval_LOCATION_f1": 0.7777777777777779, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6923076923076923, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7972027972027972, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7307692307692307, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9038461538461539, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8703703703703703, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5957446808510638, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1276998519897461, "eval_overall_accuracy": 0.9597478176527643, "eval_overall_f1": 0.8295904887714662, "eval_overall_precision": 0.7658536585365854, "eval_overall_recall": 0.9048991354466859, "eval_runtime": 0.3284, "eval_samples_per_second": 569.448, "eval_steps_per_second": 9.136, "step": 2226 }, { "epoch": 22.0, "grad_norm": 0.8688408136367798, "learning_rate": 3.9000000000000006e-05, "loss": 0.0947, "step": 2332 }, { "epoch": 22.0, "eval_LOCATION_f1": 0.7530864197530862, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6703296703296703, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.759493670886076, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6451612903225806, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.90032154340836, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.6829268292682927, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5714285714285714, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7619047619047619, "eval_TIME_number": 28, "eval_TIME_precision": 0.6857142857142857, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14317628741264343, "eval_overall_accuracy": 0.9536857419980601, "eval_overall_f1": 0.8067010309278351, "eval_overall_precision": 0.7296037296037297, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3269, "eval_samples_per_second": 571.972, "eval_steps_per_second": 9.176, "step": 2332 }, { "epoch": 23.0, "grad_norm": 1.058230996131897, "learning_rate": 3.85e-05, "loss": 0.0922, "step": 2438 }, { "epoch": 23.0, "eval_LOCATION_f1": 0.8025477707006369, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7325581395348837, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7712418300653594, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6704545454545454, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.90032154340836, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.8000000000000002, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7567567567567568, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.11902488023042679, "eval_overall_accuracy": 0.9643549951503395, "eval_overall_f1": 0.84, "eval_overall_precision": 0.7816377171215881, "eval_overall_recall": 0.9077809798270894, "eval_runtime": 0.3269, "eval_samples_per_second": 572.066, "eval_steps_per_second": 9.178, "step": 2438 }, { "epoch": 24.0, "grad_norm": 1.2606264352798462, "learning_rate": 3.8e-05, "loss": 0.0917, "step": 2544 }, { "epoch": 24.0, "eval_LOCATION_f1": 0.7530864197530862, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6703296703296703, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7534246575342466, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6790123456790124, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 28, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13196653127670288, "eval_overall_accuracy": 0.9587778855480117, "eval_overall_f1": 0.8186666666666667, "eval_overall_precision": 0.7617866004962779, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3273, "eval_samples_per_second": 571.298, "eval_steps_per_second": 9.165, "step": 2544 }, { "epoch": 25.0, "grad_norm": 0.8119063973426819, "learning_rate": 3.7500000000000003e-05, "loss": 0.0895, "step": 2650 }, { "epoch": 25.0, "eval_LOCATION_f1": 0.7625, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6853932584269663, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7755102040816327, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6951219512195121, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.896774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.86875, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12873846292495728, "eval_overall_accuracy": 0.9599903006789525, "eval_overall_f1": 0.8233731739707836, "eval_overall_precision": 0.7635467980295566, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3259, "eval_samples_per_second": 573.763, "eval_steps_per_second": 9.205, "step": 2650 }, { "epoch": 26.0, "grad_norm": 0.6412087082862854, "learning_rate": 3.7e-05, "loss": 0.0915, "step": 2756 }, { "epoch": 26.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.759493670886076, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7483870967741936, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6444444444444445, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7272727272727273, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6363636363636364, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12941302359104156, "eval_overall_accuracy": 0.962172647914646, "eval_overall_f1": 0.8244680851063829, "eval_overall_precision": 0.7654320987654321, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3264, "eval_samples_per_second": 572.875, "eval_steps_per_second": 9.191, "step": 2756 }, { "epoch": 27.0, "grad_norm": 1.1233749389648438, "learning_rate": 3.65e-05, "loss": 0.0857, "step": 2862 }, { "epoch": 27.0, "eval_LOCATION_f1": 0.775, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6966292134831461, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7662337662337663, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6629213483146067, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.9067524115755627, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8757763975155279, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.6428571428571428, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.5294117647058824, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.78125, "eval_TIME_number": 28, "eval_TIME_precision": 0.6944444444444444, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14580127596855164, "eval_overall_accuracy": 0.9553831231813773, "eval_overall_f1": 0.8124191461836998, "eval_overall_precision": 0.7370892018779343, "eval_overall_recall": 0.9048991354466859, "eval_runtime": 0.3274, "eval_samples_per_second": 571.119, "eval_steps_per_second": 9.162, "step": 2862 }, { "epoch": 28.0, "grad_norm": 2.415337085723877, "learning_rate": 3.6e-05, "loss": 0.0846, "step": 2968 }, { "epoch": 28.0, "eval_LOCATION_f1": 0.7837837837837838, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7532467532467533, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7763157894736842, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6781609195402298, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.9009584664536742, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8650306748466258, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12516556680202484, "eval_overall_accuracy": 0.9636275460717749, "eval_overall_f1": 0.8337801608579088, "eval_overall_precision": 0.7794486215538847, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3273, "eval_samples_per_second": 571.332, "eval_steps_per_second": 9.166, "step": 2968 }, { "epoch": 29.0, "grad_norm": 0.36568284034729004, "learning_rate": 3.55e-05, "loss": 0.0828, "step": 3074 }, { "epoch": 29.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7361963190184049, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6122448979591837, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.8974358974358974, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7777777777777778, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.717948717948718, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12355955690145493, "eval_overall_accuracy": 0.9614451988360815, "eval_overall_f1": 0.8289473684210527, "eval_overall_precision": 0.7627118644067796, "eval_overall_recall": 0.9077809798270894, "eval_runtime": 0.3266, "eval_samples_per_second": 572.645, "eval_steps_per_second": 9.187, "step": 3074 }, { "epoch": 30.0, "grad_norm": 2.264235019683838, "learning_rate": 3.5e-05, "loss": 0.081, "step": 3180 }, { "epoch": 30.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7317073170731707, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6060606060606061, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.8974358974358974, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13108646869659424, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8241469816272966, "eval_overall_precision": 0.7566265060240964, "eval_overall_recall": 0.9048991354466859, "eval_runtime": 0.3263, "eval_samples_per_second": 573.006, "eval_steps_per_second": 9.193, "step": 3180 }, { "epoch": 31.0, "grad_norm": 0.646797239780426, "learning_rate": 3.45e-05, "loss": 0.0782, "step": 3286 }, { "epoch": 31.0, "eval_LOCATION_f1": 0.7530864197530862, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6703296703296703, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7532467532467532, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.651685393258427, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8945686900958466, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13420291244983673, "eval_overall_accuracy": 0.9599903006789525, "eval_overall_f1": 0.8167539267015707, "eval_overall_precision": 0.7482014388489209, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.327, "eval_samples_per_second": 571.836, "eval_steps_per_second": 9.174, "step": 3286 }, { "epoch": 32.0, "grad_norm": 0.6615414023399353, "learning_rate": 3.4000000000000007e-05, "loss": 0.0812, "step": 3392 }, { "epoch": 32.0, "eval_LOCATION_f1": 0.751592356687898, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.686046511627907, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7483870967741936, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6444444444444445, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8945686900958466, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12814216315746307, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8174603174603176, "eval_overall_precision": 0.7555012224938875, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.327, "eval_samples_per_second": 571.795, "eval_steps_per_second": 9.173, "step": 3392 }, { "epoch": 33.0, "grad_norm": 1.0747178792953491, "learning_rate": 3.35e-05, "loss": 0.0759, "step": 3498 }, { "epoch": 33.0, "eval_LOCATION_f1": 0.7612903225806451, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7023809523809523, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.782051282051282, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6703296703296703, "eval_ORGANIZATION_recall": 0.9384615384615385, "eval_PERSON_f1": 0.8974358974358974, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 28, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12921784818172455, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8269484808454426, "eval_overall_precision": 0.7634146341463415, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3274, "eval_samples_per_second": 571.082, "eval_steps_per_second": 9.162, "step": 3498 }, { "epoch": 34.0, "grad_norm": 0.9548816084861755, "learning_rate": 3.3e-05, "loss": 0.0755, "step": 3604 }, { "epoch": 34.0, "eval_LOCATION_f1": 0.7894736842105262, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7916666666666667, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7215189873417721, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 28, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.12423999607563019, "eval_overall_accuracy": 0.9614451988360815, "eval_overall_f1": 0.8279569892473119, "eval_overall_precision": 0.7758186397984886, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3276, "eval_samples_per_second": 570.793, "eval_steps_per_second": 9.157, "step": 3604 }, { "epoch": 35.0, "grad_norm": 0.42714256048202515, "learning_rate": 3.2500000000000004e-05, "loss": 0.0739, "step": 3710 }, { "epoch": 35.0, "eval_LOCATION_f1": 0.751592356687898, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.686046511627907, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7453416149068324, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.625, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.8974358974358974, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.7868852459016394, "eval_TIME_number": 28, "eval_TIME_precision": 0.7272727272727273, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.13675132393836975, "eval_overall_accuracy": 0.9568380213385063, "eval_overall_f1": 0.8141361256544503, "eval_overall_precision": 0.7458033573141487, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3266, "eval_samples_per_second": 572.553, "eval_steps_per_second": 9.185, "step": 3710 }, { "epoch": 36.0, "grad_norm": 1.520427942276001, "learning_rate": 3.2000000000000005e-05, "loss": 0.0754, "step": 3816 }, { "epoch": 36.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7672955974842768, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.648936170212766, "eval_ORGANIZATION_recall": 0.9384615384615385, "eval_PERSON_f1": 0.90032154340836, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1319383829832077, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.8289473684210527, "eval_overall_precision": 0.7627118644067796, "eval_overall_recall": 0.9077809798270894, "eval_runtime": 0.3273, "eval_samples_per_second": 571.333, "eval_steps_per_second": 9.166, "step": 3816 }, { "epoch": 37.0, "grad_norm": 0.7817038893699646, "learning_rate": 3.15e-05, "loss": 0.0703, "step": 3922 }, { "epoch": 37.0, "eval_LOCATION_f1": 0.7530864197530862, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6703296703296703, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7402597402597403, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6404494382022472, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8980891719745222, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8597560975609756, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7012987012987013, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6136363636363636, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 28, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1478222757577896, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.8093994778067884, "eval_overall_precision": 0.7398568019093079, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3267, "eval_samples_per_second": 572.415, "eval_steps_per_second": 9.183, "step": 3922 }, { "epoch": 38.0, "grad_norm": 0.6990446448326111, "learning_rate": 3.1e-05, "loss": 0.0735, "step": 4028 }, { "epoch": 38.0, "eval_LOCATION_f1": 0.8181818181818181, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7590361445783133, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.879746835443038, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8373493975903614, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.806451612903226, "eval_TIME_number": 28, "eval_TIME_precision": 0.7352941176470589, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.12963485717773438, "eval_overall_accuracy": 0.9624151309408342, "eval_overall_f1": 0.8249336870026525, "eval_overall_precision": 0.7641277641277642, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.327, "eval_samples_per_second": 571.9, "eval_steps_per_second": 9.175, "step": 4028 }, { "epoch": 39.0, "grad_norm": 1.1196815967559814, "learning_rate": 3.05e-05, "loss": 0.0718, "step": 4134 }, { "epoch": 39.0, "eval_LOCATION_f1": 0.7402597402597403, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6867469879518072, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7375, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6210526315789474, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.9038461538461539, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8703703703703703, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7671232876712328, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13455747067928314, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.8190224570673712, "eval_overall_precision": 0.7560975609756098, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3273, "eval_samples_per_second": 571.347, "eval_steps_per_second": 9.166, "step": 4134 }, { "epoch": 40.0, "grad_norm": 0.904691219329834, "learning_rate": 3e-05, "loss": 0.0694, "step": 4240 }, { "epoch": 40.0, "eval_LOCATION_f1": 0.7733333333333333, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7341772151898734, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7333333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6470588235294118, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.8945686900958466, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7733333333333333, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6904761904761905, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.806451612903226, "eval_TIME_number": 28, "eval_TIME_precision": 0.7352941176470589, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1319706290960312, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8186666666666667, "eval_overall_precision": 0.7617866004962779, "eval_overall_recall": 0.8847262247838616, "eval_runtime": 0.3287, "eval_samples_per_second": 568.914, "eval_steps_per_second": 9.127, "step": 4240 }, { "epoch": 41.0, "grad_norm": 0.4921020567417145, "learning_rate": 2.95e-05, "loss": 0.0693, "step": 4346 }, { "epoch": 41.0, "eval_LOCATION_f1": 0.7435897435897436, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6823529411764706, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7515923566878981, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6413043478260869, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.912621359223301, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8867924528301887, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7733333333333333, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6904761904761905, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14422298967838287, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8253968253968255, "eval_overall_precision": 0.7628361858190709, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3268, "eval_samples_per_second": 572.269, "eval_steps_per_second": 9.181, "step": 4346 }, { "epoch": 42.0, "grad_norm": 0.17059876024723053, "learning_rate": 2.9e-05, "loss": 0.0675, "step": 4452 }, { "epoch": 42.0, "eval_LOCATION_f1": 0.7763157894736843, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7283950617283951, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7866666666666665, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6941176470588235, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7466666666666666, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6666666666666666, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13859502971172333, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.8266666666666667, "eval_overall_precision": 0.7692307692307693, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3267, "eval_samples_per_second": 572.428, "eval_steps_per_second": 9.183, "step": 4452 }, { "epoch": 43.0, "grad_norm": 0.5693849325180054, "learning_rate": 2.8499999999999998e-05, "loss": 0.0672, "step": 4558 }, { "epoch": 43.0, "eval_LOCATION_f1": 0.7692307692307694, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7058823529411765, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8945686900958466, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.806451612903226, "eval_TIME_number": 28, "eval_TIME_precision": 0.7352941176470589, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13775749504566193, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8243064729194188, "eval_overall_precision": 0.7609756097560976, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.326, "eval_samples_per_second": 573.554, "eval_steps_per_second": 9.201, "step": 4558 }, { "epoch": 44.0, "grad_norm": 0.5870493650436401, "learning_rate": 2.8000000000000003e-05, "loss": 0.067, "step": 4664 }, { "epoch": 44.0, "eval_LOCATION_f1": 0.7866666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7468354430379747, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7712418300653594, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6704545454545454, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8475609756097561, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.8285714285714285, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7837837837837838, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13134053349494934, "eval_overall_accuracy": 0.9626576139670223, "eval_overall_f1": 0.8315508021390374, "eval_overall_precision": 0.7755610972568578, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.327, "eval_samples_per_second": 571.903, "eval_steps_per_second": 9.175, "step": 4664 }, { "epoch": 45.0, "grad_norm": 1.1741827726364136, "learning_rate": 2.7500000000000004e-05, "loss": 0.0656, "step": 4770 }, { "epoch": 45.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7837837837837838, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6987951807228916, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8974358974358974, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7200000000000001, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6428571428571429, "eval_QUANTITY_recall": 0.8181818181818182, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13948975503444672, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8320000000000001, "eval_overall_precision": 0.7741935483870968, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3274, "eval_samples_per_second": 571.187, "eval_steps_per_second": 9.163, "step": 4770 }, { "epoch": 46.0, "grad_norm": 0.8152003288269043, "learning_rate": 2.7000000000000002e-05, "loss": 0.0656, "step": 4876 }, { "epoch": 46.0, "eval_LOCATION_f1": 0.7662337662337662, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7108433734939759, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7450980392156863, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6477272727272727, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8945686900958466, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13262593746185303, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8222811671087533, "eval_overall_precision": 0.7616707616707616, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3275, "eval_samples_per_second": 571.056, "eval_steps_per_second": 9.161, "step": 4876 }, { "epoch": 47.0, "grad_norm": 0.9389750361442566, "learning_rate": 2.6500000000000004e-05, "loss": 0.062, "step": 4982 }, { "epoch": 47.0, "eval_LOCATION_f1": 0.7421383647798742, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6704545454545454, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7450980392156863, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6477272727272727, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8924050632911392, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8493975903614458, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7567567567567567, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6829268292682927, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.806451612903226, "eval_TIME_number": 28, "eval_TIME_precision": 0.7352941176470589, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.15109694004058838, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.81151832460733, "eval_overall_precision": 0.7434052757793765, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3278, "eval_samples_per_second": 570.556, "eval_steps_per_second": 9.153, "step": 4982 }, { "epoch": 48.0, "grad_norm": 1.3758347034454346, "learning_rate": 2.6000000000000002e-05, "loss": 0.0638, "step": 5088 }, { "epoch": 48.0, "eval_LOCATION_f1": 0.7875000000000001, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7078651685393258, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8853503184713376, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8475609756097561, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7733333333333333, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6904761904761905, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1447124034166336, "eval_overall_accuracy": 0.9597478176527643, "eval_overall_f1": 0.8221343873517787, "eval_overall_precision": 0.7572815533980582, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.327, "eval_samples_per_second": 571.823, "eval_steps_per_second": 9.174, "step": 5088 }, { "epoch": 49.0, "grad_norm": 0.8612605333328247, "learning_rate": 2.5500000000000003e-05, "loss": 0.0601, "step": 5194 }, { "epoch": 49.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7567567567567568, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6746987951807228, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8974358974358974, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1353224217891693, "eval_overall_accuracy": 0.962172647914646, "eval_overall_f1": 0.8288770053475935, "eval_overall_precision": 0.773067331670823, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3281, "eval_samples_per_second": 569.939, "eval_steps_per_second": 9.143, "step": 5194 }, { "epoch": 50.0, "grad_norm": 1.3004350662231445, "learning_rate": 2.5e-05, "loss": 0.0604, "step": 5300 }, { "epoch": 50.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7549668874172185, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6627906976744186, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8974358974358974, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1338462084531784, "eval_overall_accuracy": 0.9619301648884578, "eval_overall_f1": 0.8315508021390374, "eval_overall_precision": 0.7755610972568578, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3278, "eval_samples_per_second": 570.522, "eval_steps_per_second": 9.153, "step": 5300 }, { "epoch": 51.0, "grad_norm": 0.871790885925293, "learning_rate": 2.45e-05, "loss": 0.0582, "step": 5406 }, { "epoch": 51.0, "eval_LOCATION_f1": 0.7654320987654322, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6813186813186813, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7619047619047619, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6829268292682927, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9096774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.88125, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.819672131147541, "eval_TIME_number": 28, "eval_TIME_precision": 0.7575757575757576, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.13927897810935974, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8302387267904509, "eval_overall_precision": 0.769041769041769, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3272, "eval_samples_per_second": 571.49, "eval_steps_per_second": 9.168, "step": 5406 }, { "epoch": 52.0, "grad_norm": 0.7292200326919556, "learning_rate": 2.4e-05, "loss": 0.0608, "step": 5512 }, { "epoch": 52.0, "eval_LOCATION_f1": 0.7631578947368421, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7160493827160493, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7295597484276729, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6170212765957447, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8789808917197452, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8414634146341463, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.1517271101474762, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8153034300791556, "eval_overall_precision": 0.7518248175182481, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3279, "eval_samples_per_second": 570.258, "eval_steps_per_second": 9.149, "step": 5512 }, { "epoch": 53.0, "grad_norm": 0.8021668791770935, "learning_rate": 2.35e-05, "loss": 0.0575, "step": 5618 }, { "epoch": 53.0, "eval_LOCATION_f1": 0.7466666666666666, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7088607594936709, "eval_LOCATION_recall": 0.7887323943661971, "eval_ORGANIZATION_f1": 0.7361963190184049, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6122448979591837, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.8832807570977917, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8383233532934131, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.15490397810935974, "eval_overall_accuracy": 0.9556256062075654, "eval_overall_f1": 0.8125819134993448, "eval_overall_precision": 0.7451923076923077, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3281, "eval_samples_per_second": 570.008, "eval_steps_per_second": 9.145, "step": 5618 }, { "epoch": 54.0, "grad_norm": 1.3401607275009155, "learning_rate": 2.3000000000000003e-05, "loss": 0.0585, "step": 5724 }, { "epoch": 54.0, "eval_LOCATION_f1": 0.7402597402597403, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6867469879518072, "eval_LOCATION_recall": 0.8028169014084507, "eval_ORGANIZATION_f1": 0.7305389221556887, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.5980392156862745, "eval_ORGANIZATION_recall": 0.9384615384615385, "eval_PERSON_f1": 0.8825396825396825, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8424242424242424, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8813559322033899, "eval_TIME_number": 28, "eval_TIME_precision": 0.8387096774193549, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.16088581085205078, "eval_overall_accuracy": 0.9541707080504365, "eval_overall_f1": 0.811443433029909, "eval_overall_precision": 0.7393364928909952, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3275, "eval_samples_per_second": 570.964, "eval_steps_per_second": 9.16, "step": 5724 }, { "epoch": 55.0, "grad_norm": 0.5186824202537537, "learning_rate": 2.25e-05, "loss": 0.0571, "step": 5830 }, { "epoch": 55.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.75, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6551724137931034, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7733333333333333, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6904761904761905, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14577339589595795, "eval_overall_accuracy": 0.9599903006789525, "eval_overall_f1": 0.8282290279627165, "eval_overall_precision": 0.7698019801980198, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3267, "eval_samples_per_second": 572.313, "eval_steps_per_second": 9.181, "step": 5830 }, { "epoch": 56.0, "grad_norm": 1.0186669826507568, "learning_rate": 2.2000000000000003e-05, "loss": 0.0574, "step": 5936 }, { "epoch": 56.0, "eval_LOCATION_f1": 0.7848101265822784, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7126436781609196, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.90032154340836, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8695652173913043, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8333333333333334, "eval_TIME_number": 28, "eval_TIME_precision": 0.78125, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14299847185611725, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8308921438082557, "eval_overall_precision": 0.7722772277227723, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3268, "eval_samples_per_second": 572.282, "eval_steps_per_second": 9.181, "step": 5936 }, { "epoch": 57.0, "grad_norm": 0.6867424845695496, "learning_rate": 2.15e-05, "loss": 0.0549, "step": 6042 }, { "epoch": 57.0, "eval_LOCATION_f1": 0.779874213836478, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7045454545454546, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7808219178082192, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7037037037037037, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8917197452229298, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8536585365853658, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.14952713251113892, "eval_overall_accuracy": 0.9616876818622696, "eval_overall_f1": 0.8335552596537948, "eval_overall_precision": 0.7747524752475248, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3268, "eval_samples_per_second": 572.296, "eval_steps_per_second": 9.181, "step": 6042 }, { "epoch": 58.0, "grad_norm": 0.42461711168289185, "learning_rate": 2.1e-05, "loss": 0.0534, "step": 6148 }, { "epoch": 58.0, "eval_LOCATION_f1": 0.7692307692307694, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7058823529411765, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7702702702702702, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6867469879518072, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7733333333333333, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6904761904761905, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14496611058712006, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.8262032085561497, "eval_overall_precision": 0.770573566084788, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.327, "eval_samples_per_second": 571.822, "eval_steps_per_second": 9.174, "step": 6148 }, { "epoch": 59.0, "grad_norm": 2.0102553367614746, "learning_rate": 2.05e-05, "loss": 0.0513, "step": 6254 }, { "epoch": 59.0, "eval_LOCATION_f1": 0.7532467532467533, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6987951807228916, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7692307692307692, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6593406593406593, "eval_ORGANIZATION_recall": 0.9230769230769231, "eval_PERSON_f1": 0.8945686900958466, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.912280701754386, "eval_TIME_number": 28, "eval_TIME_precision": 0.896551724137931, "eval_TIME_recall": 0.9285714285714286, "eval_loss": 0.147059828042984, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8302387267904509, "eval_overall_precision": 0.769041769041769, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3282, "eval_samples_per_second": 569.709, "eval_steps_per_second": 9.14, "step": 6254 }, { "epoch": 60.0, "grad_norm": 1.5348504781723022, "learning_rate": 2e-05, "loss": 0.0524, "step": 6360 }, { "epoch": 60.0, "eval_LOCATION_f1": 0.7631578947368421, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7160493827160493, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7712418300653594, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6704545454545454, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.888178913738019, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.852760736196319, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14413262903690338, "eval_overall_accuracy": 0.9599903006789525, "eval_overall_f1": 0.8273092369477911, "eval_overall_precision": 0.7725, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.327, "eval_samples_per_second": 571.842, "eval_steps_per_second": 9.174, "step": 6360 }, { "epoch": 61.0, "grad_norm": 1.0918995141983032, "learning_rate": 1.9500000000000003e-05, "loss": 0.0523, "step": 6466 }, { "epoch": 61.0, "eval_LOCATION_f1": 0.7581699346405228, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7073170731707317, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7564102564102564, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6483516483516484, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.888888888888889, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8484848484848485, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15414579212665558, "eval_overall_accuracy": 0.9585354025218235, "eval_overall_f1": 0.8222811671087533, "eval_overall_precision": 0.7616707616707616, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3259, "eval_samples_per_second": 573.773, "eval_steps_per_second": 9.205, "step": 6466 }, { "epoch": 62.0, "grad_norm": 0.9440881013870239, "learning_rate": 1.9e-05, "loss": 0.0531, "step": 6572 }, { "epoch": 62.0, "eval_LOCATION_f1": 0.7814569536423841, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7375, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7682119205298013, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6744186046511628, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15256355702877045, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.8306451612903226, "eval_overall_precision": 0.7783375314861462, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.326, "eval_samples_per_second": 573.658, "eval_steps_per_second": 9.203, "step": 6572 }, { "epoch": 63.0, "grad_norm": 1.0544549226760864, "learning_rate": 1.85e-05, "loss": 0.0495, "step": 6678 }, { "epoch": 63.0, "eval_LOCATION_f1": 0.7483870967741935, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.6904761904761905, "eval_LOCATION_recall": 0.8169014084507042, "eval_ORGANIZATION_f1": 0.7435897435897436, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6373626373626373, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8771929824561403, "eval_TIME_number": 28, "eval_TIME_precision": 0.8620689655172413, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1558208018541336, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8218085106382977, "eval_overall_precision": 0.762962962962963, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.327, "eval_samples_per_second": 571.805, "eval_steps_per_second": 9.173, "step": 6678 }, { "epoch": 64.0, "grad_norm": 0.0981023833155632, "learning_rate": 1.8e-05, "loss": 0.0503, "step": 6784 }, { "epoch": 64.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7733333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6823529411764706, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8974358974358974, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7733333333333333, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6904761904761905, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 28, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15108107030391693, "eval_overall_accuracy": 0.9614451988360815, "eval_overall_f1": 0.8293333333333333, "eval_overall_precision": 0.771712158808933, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3276, "eval_samples_per_second": 570.896, "eval_steps_per_second": 9.159, "step": 6784 }, { "epoch": 65.0, "grad_norm": 0.6967347264289856, "learning_rate": 1.75e-05, "loss": 0.0517, "step": 6890 }, { "epoch": 65.0, "eval_LOCATION_f1": 0.7843137254901961, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7702702702702702, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6867469879518072, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.8910256410256411, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8580246913580247, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14456935226917267, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8317631224764469, "eval_overall_precision": 0.7803030303030303, "eval_overall_recall": 0.8904899135446686, "eval_runtime": 0.3275, "eval_samples_per_second": 570.976, "eval_steps_per_second": 9.16, "step": 6890 }, { "epoch": 66.0, "grad_norm": 0.616130530834198, "learning_rate": 1.7000000000000003e-05, "loss": 0.0493, "step": 6996 }, { "epoch": 66.0, "eval_LOCATION_f1": 0.7875000000000001, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7078651685393258, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7532467532467532, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.651685393258427, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7272727272727273, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6363636363636364, "eval_QUANTITY_recall": 0.8484848484848485, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 28, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16076360642910004, "eval_overall_accuracy": 0.9570805043646945, "eval_overall_f1": 0.8236842105263158, "eval_overall_precision": 0.7578692493946732, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3273, "eval_samples_per_second": 571.374, "eval_steps_per_second": 9.166, "step": 6996 }, { "epoch": 67.0, "grad_norm": 0.8930002450942993, "learning_rate": 1.65e-05, "loss": 0.0508, "step": 7102 }, { "epoch": 67.0, "eval_LOCATION_f1": 0.7848101265822784, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7126436781609196, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7581699346405228, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6590909090909091, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.888178913738019, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.852760736196319, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7631578947368421, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6744186046511628, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1603231132030487, "eval_overall_accuracy": 0.957807953443259, "eval_overall_f1": 0.8232189973614775, "eval_overall_precision": 0.7591240875912408, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3264, "eval_samples_per_second": 572.961, "eval_steps_per_second": 9.192, "step": 7102 }, { "epoch": 68.0, "grad_norm": 0.3851192891597748, "learning_rate": 1.6000000000000003e-05, "loss": 0.0486, "step": 7208 }, { "epoch": 68.0, "eval_LOCATION_f1": 0.7612903225806451, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7023809523809523, "eval_LOCATION_recall": 0.8309859154929577, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7733333333333333, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6904761904761905, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14870406687259674, "eval_overall_accuracy": 0.9595053346265762, "eval_overall_f1": 0.8213333333333332, "eval_overall_precision": 0.7642679900744417, "eval_overall_recall": 0.8876080691642652, "eval_runtime": 0.3249, "eval_samples_per_second": 575.524, "eval_steps_per_second": 9.233, "step": 7208 }, { "epoch": 69.0, "grad_norm": 0.668571949005127, "learning_rate": 1.55e-05, "loss": 0.0475, "step": 7314 }, { "epoch": 69.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8945686900958466, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8588957055214724, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15184400975704193, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8353413654618473, "eval_overall_precision": 0.78, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3285, "eval_samples_per_second": 569.263, "eval_steps_per_second": 9.133, "step": 7314 }, { "epoch": 70.0, "grad_norm": 1.2341712713241577, "learning_rate": 1.5e-05, "loss": 0.0491, "step": 7420 }, { "epoch": 70.0, "eval_LOCATION_f1": 0.8133333333333335, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7721518987341772, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7837837837837838, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6987951807228916, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.14618448913097382, "eval_overall_accuracy": 0.9629000969932104, "eval_overall_f1": 0.8389715832205683, "eval_overall_precision": 0.7908163265306123, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3272, "eval_samples_per_second": 571.603, "eval_steps_per_second": 9.17, "step": 7420 }, { "epoch": 71.0, "grad_norm": 0.7431372404098511, "learning_rate": 1.45e-05, "loss": 0.0462, "step": 7526 }, { "epoch": 71.0, "eval_LOCATION_f1": 0.7848101265822784, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7126436781609196, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.888178913738019, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.852760736196319, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7733333333333333, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.6904761904761905, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1648775339126587, "eval_overall_accuracy": 0.9582929194956353, "eval_overall_f1": 0.8269484808454426, "eval_overall_precision": 0.7634146341463415, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3274, "eval_samples_per_second": 571.19, "eval_steps_per_second": 9.163, "step": 7526 }, { "epoch": 72.0, "grad_norm": 0.7144307494163513, "learning_rate": 1.4000000000000001e-05, "loss": 0.046, "step": 7632 }, { "epoch": 72.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7712418300653594, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6704545454545454, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.8903225806451613, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8625, "eval_PERSON_recall": 0.92, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.7999999999999999, "eval_TIME_number": 28, "eval_TIME_precision": 0.75, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1596042811870575, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8308921438082557, "eval_overall_precision": 0.7722772277227723, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3254, "eval_samples_per_second": 574.71, "eval_steps_per_second": 9.22, "step": 7632 }, { "epoch": 73.0, "grad_norm": 0.5636935830116272, "learning_rate": 1.3500000000000001e-05, "loss": 0.0453, "step": 7738 }, { "epoch": 73.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8938906752411575, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8633540372670807, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7837837837837839, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7073170731707317, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8474576271186439, "eval_TIME_number": 28, "eval_TIME_precision": 0.8064516129032258, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.1584891676902771, "eval_overall_accuracy": 0.9592628516003879, "eval_overall_f1": 0.8315508021390374, "eval_overall_precision": 0.7755610972568578, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3271, "eval_samples_per_second": 571.735, "eval_steps_per_second": 9.172, "step": 7738 }, { "epoch": 74.0, "grad_norm": 0.8465162515640259, "learning_rate": 1.3000000000000001e-05, "loss": 0.0467, "step": 7844 }, { "epoch": 74.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7516778523489933, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.8996763754045306, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8742138364779874, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 28, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1548159122467041, "eval_overall_accuracy": 0.9604752667313288, "eval_overall_f1": 0.8322147651006712, "eval_overall_precision": 0.7788944723618091, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3278, "eval_samples_per_second": 570.444, "eval_steps_per_second": 9.152, "step": 7844 }, { "epoch": 75.0, "grad_norm": 1.0343018770217896, "learning_rate": 1.25e-05, "loss": 0.0443, "step": 7950 }, { "epoch": 75.0, "eval_LOCATION_f1": 0.823529411764706, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7682926829268293, "eval_LOCATION_recall": 0.8873239436619719, "eval_ORGANIZATION_f1": 0.7368421052631579, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6436781609195402, "eval_ORGANIZATION_recall": 0.8615384615384616, "eval_PERSON_f1": 0.9025974025974027, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.879746835443038, "eval_PERSON_recall": 0.9266666666666666, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8135593220338982, "eval_TIME_number": 28, "eval_TIME_precision": 0.7741935483870968, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15346647799015045, "eval_overall_accuracy": 0.9616876818622696, "eval_overall_f1": 0.8348993288590604, "eval_overall_precision": 0.7814070351758794, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3271, "eval_samples_per_second": 571.622, "eval_steps_per_second": 9.17, "step": 7950 }, { "epoch": 76.0, "grad_norm": 0.05382401496171951, "learning_rate": 1.2e-05, "loss": 0.0447, "step": 8056 }, { "epoch": 76.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7814569536423841, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.686046511627907, "eval_ORGANIZATION_recall": 0.9076923076923077, "eval_PERSON_f1": 0.9061488673139159, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8805031446540881, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8620689655172413, "eval_TIME_number": 28, "eval_TIME_precision": 0.8333333333333334, "eval_TIME_recall": 0.8928571428571429, "eval_loss": 0.16000644862651825, "eval_overall_accuracy": 0.9619301648884578, "eval_overall_f1": 0.8467741935483871, "eval_overall_precision": 0.7934508816120907, "eval_overall_recall": 0.9077809798270894, "eval_runtime": 0.326, "eval_samples_per_second": 573.613, "eval_steps_per_second": 9.202, "step": 8056 }, { "epoch": 77.0, "grad_norm": 9.811291694641113, "learning_rate": 1.1500000000000002e-05, "loss": 0.0441, "step": 8162 }, { "epoch": 77.0, "eval_LOCATION_f1": 0.7721518987341772, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7011494252873564, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7808219178082192, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.7037037037037037, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.8055555555555556, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.7435897435897436, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15801285207271576, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8371467025572005, "eval_overall_precision": 0.7853535353535354, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.328, "eval_samples_per_second": 570.116, "eval_steps_per_second": 9.146, "step": 8162 }, { "epoch": 78.0, "grad_norm": 1.3943322896957397, "learning_rate": 1.1000000000000001e-05, "loss": 0.0438, "step": 8268 }, { "epoch": 78.0, "eval_LOCATION_f1": 0.782051282051282, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7176470588235294, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7785234899328859, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6904761904761905, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15934574604034424, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8387096774193548, "eval_overall_precision": 0.7858942065491183, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3262, "eval_samples_per_second": 573.317, "eval_steps_per_second": 9.198, "step": 8268 }, { "epoch": 79.0, "grad_norm": 0.6321301460266113, "learning_rate": 1.05e-05, "loss": 0.0449, "step": 8374 }, { "epoch": 79.0, "eval_LOCATION_f1": 0.7843137254901961, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7317073170731707, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7651006711409396, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6785714285714286, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15974144637584686, "eval_overall_accuracy": 0.960717749757517, "eval_overall_f1": 0.8367071524966262, "eval_overall_precision": 0.7868020304568528, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3286, "eval_samples_per_second": 569.091, "eval_steps_per_second": 9.13, "step": 8374 }, { "epoch": 80.0, "grad_norm": 0.5539495348930359, "learning_rate": 1e-05, "loss": 0.0436, "step": 8480 }, { "epoch": 80.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7785234899328859, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6904761904761905, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9061488673139159, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8805031446540881, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16229036450386047, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8421052631578949, "eval_overall_precision": 0.7918781725888325, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3259, "eval_samples_per_second": 573.851, "eval_steps_per_second": 9.206, "step": 8480 }, { "epoch": 81.0, "grad_norm": 3.007709503173828, "learning_rate": 9.5e-06, "loss": 0.0434, "step": 8586 }, { "epoch": 81.0, "eval_LOCATION_f1": 0.8, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7380952380952381, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7581699346405228, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6590909090909091, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8275862068965518, "eval_TIME_number": 28, "eval_TIME_precision": 0.8, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1612003743648529, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.835781041388518, "eval_overall_precision": 0.7786069651741293, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3275, "eval_samples_per_second": 571.067, "eval_steps_per_second": 9.162, "step": 8586 }, { "epoch": 82.0, "grad_norm": 1.6446222066879272, "learning_rate": 9e-06, "loss": 0.0428, "step": 8692 }, { "epoch": 82.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7586206896551724, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6875, "eval_ORGANIZATION_recall": 0.8461538461538461, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15457752346992493, "eval_overall_accuracy": 0.9616876818622696, "eval_overall_f1": 0.8401084010840109, "eval_overall_precision": 0.7928388746803069, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3262, "eval_samples_per_second": 573.188, "eval_steps_per_second": 9.196, "step": 8692 }, { "epoch": 83.0, "grad_norm": 0.6172337532043457, "learning_rate": 8.500000000000002e-06, "loss": 0.043, "step": 8798 }, { "epoch": 83.0, "eval_LOCATION_f1": 0.7792207792207793, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7228915662650602, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.76, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6705882352941176, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16485904157161713, "eval_overall_accuracy": 0.9590203685741998, "eval_overall_f1": 0.8344549125168236, "eval_overall_precision": 0.7828282828282829, "eval_overall_recall": 0.8933717579250721, "eval_runtime": 0.3271, "eval_samples_per_second": 571.666, "eval_steps_per_second": 9.171, "step": 8798 }, { "epoch": 84.0, "grad_norm": 0.48714974522590637, "learning_rate": 8.000000000000001e-06, "loss": 0.0451, "step": 8904 }, { "epoch": 84.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7755102040816327, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6951219512195121, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15948227047920227, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8421052631578949, "eval_overall_precision": 0.7918781725888325, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3279, "eval_samples_per_second": 570.348, "eval_steps_per_second": 9.15, "step": 8904 }, { "epoch": 85.0, "grad_norm": 0.8867198824882507, "learning_rate": 7.5e-06, "loss": 0.0444, "step": 9010 }, { "epoch": 85.0, "eval_LOCATION_f1": 0.8051948051948051, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7469879518072289, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7682119205298013, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6744186046511628, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9061488673139159, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8805031446540881, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16462980210781097, "eval_overall_accuracy": 0.960717749757517, "eval_overall_f1": 0.8413978494623656, "eval_overall_precision": 0.7884130982367759, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3281, "eval_samples_per_second": 569.983, "eval_steps_per_second": 9.144, "step": 9010 }, { "epoch": 86.0, "grad_norm": 0.4750601649284363, "learning_rate": 7.000000000000001e-06, "loss": 0.0406, "step": 9116 }, { "epoch": 86.0, "eval_LOCATION_f1": 0.8026315789473684, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7530864197530864, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7702702702702702, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6867469879518072, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9096774193548387, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.88125, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15999138355255127, "eval_overall_accuracy": 0.9619301648884578, "eval_overall_f1": 0.8432432432432433, "eval_overall_precision": 0.7938931297709924, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3277, "eval_samples_per_second": 570.57, "eval_steps_per_second": 9.154, "step": 9116 }, { "epoch": 87.0, "grad_norm": 0.6775397658348083, "learning_rate": 6.5000000000000004e-06, "loss": 0.0415, "step": 9222 }, { "epoch": 87.0, "eval_LOCATION_f1": 0.8104575163398693, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7560975609756098, "eval_LOCATION_recall": 0.8732394366197183, "eval_ORGANIZATION_f1": 0.7785234899328859, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6904761904761905, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8974358974358974, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16279393434524536, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8413978494623656, "eval_overall_precision": 0.7884130982367759, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3261, "eval_samples_per_second": 573.372, "eval_steps_per_second": 9.198, "step": 9222 }, { "epoch": 88.0, "grad_norm": 0.4834389090538025, "learning_rate": 6e-06, "loss": 0.0407, "step": 9328 }, { "epoch": 88.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7682119205298013, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6744186046511628, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9061488673139159, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8805031446540881, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8571428571428571, "eval_TIME_number": 28, "eval_TIME_precision": 0.8571428571428571, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1641407161951065, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8409703504043127, "eval_overall_precision": 0.789873417721519, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3268, "eval_samples_per_second": 572.15, "eval_steps_per_second": 9.179, "step": 9328 }, { "epoch": 89.0, "grad_norm": 3.0661368370056152, "learning_rate": 5.500000000000001e-06, "loss": 0.0426, "step": 9434 }, { "epoch": 89.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7733333333333334, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6823529411764706, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9067524115755627, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8757763975155279, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1607460379600525, "eval_overall_accuracy": 0.962172647914646, "eval_overall_f1": 0.8413978494623656, "eval_overall_precision": 0.7884130982367759, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3275, "eval_samples_per_second": 571.022, "eval_steps_per_second": 9.161, "step": 9434 }, { "epoch": 90.0, "grad_norm": 0.5167478919029236, "learning_rate": 5e-06, "loss": 0.041, "step": 9540 }, { "epoch": 90.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7837837837837838, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6987951807228916, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16166909039020538, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8421052631578949, "eval_overall_precision": 0.7918781725888325, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3276, "eval_samples_per_second": 570.818, "eval_steps_per_second": 9.158, "step": 9540 }, { "epoch": 91.0, "grad_norm": 0.6979191303253174, "learning_rate": 4.5e-06, "loss": 0.0406, "step": 9646 }, { "epoch": 91.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16465260088443756, "eval_overall_accuracy": 0.960717749757517, "eval_overall_f1": 0.8375838926174496, "eval_overall_precision": 0.7839195979899497, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3268, "eval_samples_per_second": 572.184, "eval_steps_per_second": 9.179, "step": 9646 }, { "epoch": 92.0, "grad_norm": 0.35358938574790955, "learning_rate": 4.000000000000001e-06, "loss": 0.0408, "step": 9752 }, { "epoch": 92.0, "eval_LOCATION_f1": 0.7894736842105262, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7407407407407407, "eval_LOCATION_recall": 0.8450704225352113, "eval_ORGANIZATION_f1": 0.7702702702702702, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6867469879518072, "eval_ORGANIZATION_recall": 0.8769230769230769, "eval_PERSON_f1": 0.9067524115755627, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8757763975155279, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.15703369677066803, "eval_overall_accuracy": 0.962172647914646, "eval_overall_f1": 0.8394062078272604, "eval_overall_precision": 0.7893401015228426, "eval_overall_recall": 0.8962536023054755, "eval_runtime": 0.3273, "eval_samples_per_second": 571.285, "eval_steps_per_second": 9.165, "step": 9752 }, { "epoch": 93.0, "grad_norm": 0.4786812365055084, "learning_rate": 3.5000000000000004e-06, "loss": 0.0411, "step": 9858 }, { "epoch": 93.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9067524115755627, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8757763975155279, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1660545915365219, "eval_overall_accuracy": 0.960717749757517, "eval_overall_f1": 0.8380187416331996, "eval_overall_precision": 0.7825, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.328, "eval_samples_per_second": 570.159, "eval_steps_per_second": 9.147, "step": 9858 }, { "epoch": 94.0, "grad_norm": 0.8427369594573975, "learning_rate": 3e-06, "loss": 0.04, "step": 9964 }, { "epoch": 94.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16458158195018768, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8375838926174496, "eval_overall_precision": 0.7839195979899497, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.327, "eval_samples_per_second": 571.854, "eval_steps_per_second": 9.174, "step": 9964 }, { "epoch": 95.0, "grad_norm": 1.0689115524291992, "learning_rate": 2.5e-06, "loss": 0.0372, "step": 10070 }, { "epoch": 95.0, "eval_LOCATION_f1": 0.7922077922077921, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7349397590361446, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9067524115755627, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8757763975155279, "eval_PERSON_recall": 0.94, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16513913869857788, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8380187416331996, "eval_overall_precision": 0.7825, "eval_overall_recall": 0.9020172910662824, "eval_runtime": 0.3273, "eval_samples_per_second": 571.379, "eval_steps_per_second": 9.167, "step": 10070 }, { "epoch": 96.0, "grad_norm": 0.6339386105537415, "learning_rate": 2.0000000000000003e-06, "loss": 0.0393, "step": 10176 }, { "epoch": 96.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.8974358974358974, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.8641975308641975, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1637803018093109, "eval_overall_accuracy": 0.9614451988360815, "eval_overall_f1": 0.8353413654618473, "eval_overall_precision": 0.78, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3261, "eval_samples_per_second": 573.445, "eval_steps_per_second": 9.2, "step": 10176 }, { "epoch": 97.0, "grad_norm": 0.6922338604927063, "learning_rate": 1.5e-06, "loss": 0.0396, "step": 10282 }, { "epoch": 97.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16408979892730713, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8375838926174496, "eval_overall_precision": 0.7839195979899497, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3277, "eval_samples_per_second": 570.597, "eval_steps_per_second": 9.154, "step": 10282 }, { "epoch": 98.0, "grad_norm": 1.161203384399414, "learning_rate": 1.0000000000000002e-06, "loss": 0.0385, "step": 10388 }, { "epoch": 98.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1643643081188202, "eval_overall_accuracy": 0.9609602327837051, "eval_overall_f1": 0.8375838926174496, "eval_overall_precision": 0.7839195979899497, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3284, "eval_samples_per_second": 569.344, "eval_steps_per_second": 9.134, "step": 10388 }, { "epoch": 99.0, "grad_norm": 0.5302362442016602, "learning_rate": 5.000000000000001e-07, "loss": 0.0382, "step": 10494 }, { "epoch": 99.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.1647883802652359, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8375838926174496, "eval_overall_precision": 0.7839195979899497, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3268, "eval_samples_per_second": 572.201, "eval_steps_per_second": 9.18, "step": 10494 }, { "epoch": 100.0, "grad_norm": 0.16222168505191803, "learning_rate": 0.0, "loss": 0.0411, "step": 10600 }, { "epoch": 100.0, "eval_LOCATION_f1": 0.7973856209150327, "eval_LOCATION_number": 71, "eval_LOCATION_precision": 0.7439024390243902, "eval_LOCATION_recall": 0.8591549295774648, "eval_ORGANIZATION_f1": 0.7631578947368421, "eval_ORGANIZATION_number": 65, "eval_ORGANIZATION_precision": 0.6666666666666666, "eval_ORGANIZATION_recall": 0.8923076923076924, "eval_PERSON_f1": 0.9032258064516129, "eval_PERSON_number": 150, "eval_PERSON_precision": 0.875, "eval_PERSON_recall": 0.9333333333333333, "eval_QUANTITY_f1": 0.7945205479452054, "eval_QUANTITY_number": 33, "eval_QUANTITY_precision": 0.725, "eval_QUANTITY_recall": 0.8787878787878788, "eval_TIME_f1": 0.8421052631578947, "eval_TIME_number": 28, "eval_TIME_precision": 0.8275862068965517, "eval_TIME_recall": 0.8571428571428571, "eval_loss": 0.16485615074634552, "eval_overall_accuracy": 0.9612027158098934, "eval_overall_f1": 0.8375838926174496, "eval_overall_precision": 0.7839195979899497, "eval_overall_recall": 0.899135446685879, "eval_runtime": 0.3263, "eval_samples_per_second": 573.127, "eval_steps_per_second": 9.195, "step": 10600 }, { "epoch": 100.0, "step": 10600, "total_flos": 5123217774191952.0, "train_loss": 0.08768324019773951, "train_runtime": 561.3026, "train_samples_per_second": 300.729, "train_steps_per_second": 18.885 } ], "logging_steps": 500, "max_steps": 10600, "num_input_tokens_seen": 0, "num_train_epochs": 100, "save_steps": 500, "total_flos": 5123217774191952.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }