|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 10600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 2.6862921714782715, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 0.9792, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.18095238095238095, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.31666666666666665, |
|
"eval_PERSON_recall": 0.12666666666666668, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.06666666666666667, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.5, |
|
"eval_TIME_recall": 0.03571428571428571, |
|
"eval_loss": 0.5512092113494873, |
|
"eval_overall_accuracy": 0.850387972841901, |
|
"eval_overall_f1": 0.09501187648456057, |
|
"eval_overall_precision": 0.2702702702702703, |
|
"eval_overall_recall": 0.05763688760806916, |
|
"eval_runtime": 0.3324, |
|
"eval_samples_per_second": 562.651, |
|
"eval_steps_per_second": 9.026, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 1.0679957866668701, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.4837, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.41739130434782606, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.5454545454545454, |
|
"eval_LOCATION_recall": 0.3380281690140845, |
|
"eval_ORGANIZATION_f1": 0.019801980198019802, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.027777777777777776, |
|
"eval_ORGANIZATION_recall": 0.015384615384615385, |
|
"eval_PERSON_f1": 0.6831955922865013, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.5821596244131455, |
|
"eval_PERSON_recall": 0.8266666666666667, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.5454545454545454, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.47368421052631576, |
|
"eval_TIME_recall": 0.6428571428571429, |
|
"eval_loss": 0.33068543672561646, |
|
"eval_overall_accuracy": 0.9022793404461688, |
|
"eval_overall_f1": 0.4798850574712644, |
|
"eval_overall_precision": 0.4785100286532951, |
|
"eval_overall_recall": 0.4812680115273775, |
|
"eval_runtime": 0.3251, |
|
"eval_samples_per_second": 575.209, |
|
"eval_steps_per_second": 9.228, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 0.8312263488769531, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.3133, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.5306122448979592, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.5131578947368421, |
|
"eval_LOCATION_recall": 0.5492957746478874, |
|
"eval_ORGANIZATION_f1": 0.4000000000000001, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.34444444444444444, |
|
"eval_ORGANIZATION_recall": 0.47692307692307695, |
|
"eval_PERSON_f1": 0.7710843373493976, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7032967032967034, |
|
"eval_PERSON_recall": 0.8533333333333334, |
|
"eval_QUANTITY_f1": 0.5194805194805195, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.45454545454545453, |
|
"eval_QUANTITY_recall": 0.6060606060606061, |
|
"eval_TIME_f1": 0.793103448275862, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7666666666666667, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.21400973200798035, |
|
"eval_overall_accuracy": 0.9308923375363725, |
|
"eval_overall_f1": 0.6267880364109232, |
|
"eval_overall_precision": 0.5710900473933649, |
|
"eval_overall_recall": 0.6945244956772334, |
|
"eval_runtime": 0.3261, |
|
"eval_samples_per_second": 573.482, |
|
"eval_steps_per_second": 9.2, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 1.0169802904129028, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.2327, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.6436781609195402, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.5436893203883495, |
|
"eval_LOCATION_recall": 0.7887323943661971, |
|
"eval_ORGANIZATION_f1": 0.5590062111801243, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.46875, |
|
"eval_ORGANIZATION_recall": 0.6923076923076923, |
|
"eval_PERSON_f1": 0.8421052631578947, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7861271676300579, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.5897435897435898, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5111111111111111, |
|
"eval_QUANTITY_recall": 0.696969696969697, |
|
"eval_TIME_f1": 0.7719298245614034, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7586206896551724, |
|
"eval_TIME_recall": 0.7857142857142857, |
|
"eval_loss": 0.17442111670970917, |
|
"eval_overall_accuracy": 0.9408341416100873, |
|
"eval_overall_f1": 0.7112232030264818, |
|
"eval_overall_precision": 0.6322869955156951, |
|
"eval_overall_recall": 0.8126801152737753, |
|
"eval_runtime": 0.3287, |
|
"eval_samples_per_second": 568.904, |
|
"eval_steps_per_second": 9.127, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 1.3268284797668457, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.1989, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.7215189873417721, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6551724137931034, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.6493506493506495, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5617977528089888, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8652037617554857, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8165680473372781, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6329113924050633, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5434782608695652, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.7796610169491526, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7419354838709677, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.1507454365491867, |
|
"eval_overall_accuracy": 0.9481086323957323, |
|
"eval_overall_f1": 0.7620286085825748, |
|
"eval_overall_precision": 0.6943127962085308, |
|
"eval_overall_recall": 0.8443804034582133, |
|
"eval_runtime": 0.3267, |
|
"eval_samples_per_second": 572.456, |
|
"eval_steps_per_second": 9.184, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 1.4492706060409546, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.1782, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.7088607594936709, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6436781609195402, |
|
"eval_LOCATION_recall": 0.7887323943661971, |
|
"eval_ORGANIZATION_f1": 0.6473988439306357, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5185185185185185, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8598130841121495, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8070175438596491, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6352941176470589, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5192307692307693, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.746268656716418, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6410256410256411, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.17294442653656006, |
|
"eval_overall_accuracy": 0.9425315227934045, |
|
"eval_overall_f1": 0.7512437810945274, |
|
"eval_overall_precision": 0.6608315098468271, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.327, |
|
"eval_samples_per_second": 571.852, |
|
"eval_steps_per_second": 9.174, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 2.372952938079834, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.1675, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.7407407407407407, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6593406593406593, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.675, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5684210526315789, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8706624605678233, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8263473053892215, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7179487179487178, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6222222222222222, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1436489075422287, |
|
"eval_overall_accuracy": 0.950533462657614, |
|
"eval_overall_f1": 0.7784891165172856, |
|
"eval_overall_precision": 0.7004608294930875, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3264, |
|
"eval_samples_per_second": 572.836, |
|
"eval_steps_per_second": 9.19, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 0.5531976222991943, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.1523, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.7643312101910827, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6976744186046512, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.6832298136645962, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5729166666666666, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8670886075949367, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8253012048192772, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.736842105263158, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6511627906976745, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7936507936507937, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1423933058977127, |
|
"eval_overall_accuracy": 0.9527158098933075, |
|
"eval_overall_f1": 0.7891332470892625, |
|
"eval_overall_precision": 0.715962441314554, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3281, |
|
"eval_samples_per_second": 570.034, |
|
"eval_steps_per_second": 9.145, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 1.0425461530685425, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.148, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7466666666666668, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6588235294117647, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8690095846645367, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8343558282208589, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5777777777777777, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13000667095184326, |
|
"eval_overall_accuracy": 0.9556256062075654, |
|
"eval_overall_f1": 0.8015873015873015, |
|
"eval_overall_precision": 0.7408312958435208, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.3275, |
|
"eval_samples_per_second": 571.032, |
|
"eval_steps_per_second": 9.161, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 0.9898656606674194, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.1376, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7320261437908497, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6363636363636364, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.888178913738019, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.852760736196319, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7088607594936709, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6086956521739131, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.12935131788253784, |
|
"eval_overall_accuracy": 0.9568380213385063, |
|
"eval_overall_f1": 0.8131578947368422, |
|
"eval_overall_precision": 0.7481840193704601, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3271, |
|
"eval_samples_per_second": 571.762, |
|
"eval_steps_per_second": 9.173, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 1.2879328727722168, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.1378, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.7532467532467533, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6987951807228916, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.728476821192053, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6395348837209303, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.888178913738019, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.852760736196319, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.12860190868377686, |
|
"eval_overall_accuracy": 0.9565955383123181, |
|
"eval_overall_f1": 0.8063660477453581, |
|
"eval_overall_precision": 0.7469287469287469, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3281, |
|
"eval_samples_per_second": 570.029, |
|
"eval_steps_per_second": 9.145, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 1.0456236600875854, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.1279, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.728395061728395, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6483516483516484, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7375, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6210526315789474, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.8974358974358974, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.736842105263158, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6511627906976745, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.6865671641791046, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.5897435897435898, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.14702975749969482, |
|
"eval_overall_accuracy": 0.9524733268671193, |
|
"eval_overall_f1": 0.7953667953667953, |
|
"eval_overall_precision": 0.7186046511627907, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.329, |
|
"eval_samples_per_second": 568.322, |
|
"eval_steps_per_second": 9.117, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 0.7470729351043701, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.1257, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.7763157894736843, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7283950617283951, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7631578947368421, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8917197452229298, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8536585365853658, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8070175438596492, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7931034482758621, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.12572742998600006, |
|
"eval_overall_accuracy": 0.9597478176527643, |
|
"eval_overall_f1": 0.823529411764706, |
|
"eval_overall_precision": 0.7680798004987531, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.326, |
|
"eval_samples_per_second": 573.579, |
|
"eval_steps_per_second": 9.202, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 1.587265133857727, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.1211, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.7643312101910827, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6976744186046512, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7712418300653594, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6704545454545454, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.8753993610223643, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7466666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.6956521739130435, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.5853658536585366, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.12821051478385925, |
|
"eval_overall_accuracy": 0.9565955383123181, |
|
"eval_overall_f1": 0.8031290743155148, |
|
"eval_overall_precision": 0.7333333333333333, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3277, |
|
"eval_samples_per_second": 570.653, |
|
"eval_steps_per_second": 9.155, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 1.1898987293243408, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.1182, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.794701986754967, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7532467532467532, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.651685393258427, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8945686900958466, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.12380851060152054, |
|
"eval_overall_accuracy": 0.960717749757517, |
|
"eval_overall_f1": 0.8255659121171772, |
|
"eval_overall_precision": 0.7673267326732673, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3297, |
|
"eval_samples_per_second": 567.219, |
|
"eval_steps_per_second": 9.1, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 1.2394359111785889, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.1084, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.7733333333333333, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7341772151898734, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7712418300653594, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6704545454545454, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.888178913738019, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.852760736196319, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7466666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.12522907555103302, |
|
"eval_overall_accuracy": 0.9595053346265762, |
|
"eval_overall_f1": 0.8180610889774237, |
|
"eval_overall_precision": 0.7586206896551724, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3284, |
|
"eval_samples_per_second": 569.484, |
|
"eval_steps_per_second": 9.136, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 0.5448505878448486, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.11, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7428571428571429, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6933333333333334, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8917197452229298, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8536585365853658, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.11857786774635315, |
|
"eval_overall_accuracy": 0.962172647914646, |
|
"eval_overall_f1": 0.8243243243243243, |
|
"eval_overall_precision": 0.7760814249363868, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3269, |
|
"eval_samples_per_second": 572.103, |
|
"eval_steps_per_second": 9.178, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 0.928116500377655, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.105, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.7843137254901961, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7317073170731707, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7402597402597403, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6404494382022472, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.90032154340836, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.736842105263158, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6511627906976745, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13439632952213287, |
|
"eval_overall_accuracy": 0.9568380213385063, |
|
"eval_overall_f1": 0.8153034300791556, |
|
"eval_overall_precision": 0.7518248175182481, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3276, |
|
"eval_samples_per_second": 570.855, |
|
"eval_steps_per_second": 9.158, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 0.6120880246162415, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.1012, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.778523489932886, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7435897435897436, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.76, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6705882352941176, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.8000000000000002, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7567567567567568, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1134907528758049, |
|
"eval_overall_accuracy": 0.9643549951503395, |
|
"eval_overall_f1": 0.8299319727891157, |
|
"eval_overall_precision": 0.7860824742268041, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3267, |
|
"eval_samples_per_second": 572.422, |
|
"eval_steps_per_second": 9.183, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 0.7189091444015503, |
|
"learning_rate": 4e-05, |
|
"loss": 0.1009, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.8129032258064516, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.763888888888889, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6962025316455697, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.11710327118635178, |
|
"eval_overall_accuracy": 0.9636275460717749, |
|
"eval_overall_f1": 0.8324324324324324, |
|
"eval_overall_precision": 0.7837150127226463, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3264, |
|
"eval_samples_per_second": 572.982, |
|
"eval_steps_per_second": 9.192, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 1.2998398542404175, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.0994, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.7777777777777779, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6923076923076923, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7972027972027972, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7307692307692307, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9038461538461539, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8703703703703703, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5957446808510638, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1276998519897461, |
|
"eval_overall_accuracy": 0.9597478176527643, |
|
"eval_overall_f1": 0.8295904887714662, |
|
"eval_overall_precision": 0.7658536585365854, |
|
"eval_overall_recall": 0.9048991354466859, |
|
"eval_runtime": 0.3284, |
|
"eval_samples_per_second": 569.448, |
|
"eval_steps_per_second": 9.136, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 0.8688408136367798, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.0947, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.7530864197530862, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6703296703296703, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.759493670886076, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6451612903225806, |
|
"eval_ORGANIZATION_recall": 0.9230769230769231, |
|
"eval_PERSON_f1": 0.90032154340836, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.6829268292682927, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5714285714285714, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14317628741264343, |
|
"eval_overall_accuracy": 0.9536857419980601, |
|
"eval_overall_f1": 0.8067010309278351, |
|
"eval_overall_precision": 0.7296037296037297, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3269, |
|
"eval_samples_per_second": 571.972, |
|
"eval_steps_per_second": 9.176, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 1.058230996131897, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.0922, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.8025477707006369, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7325581395348837, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7712418300653594, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6704545454545454, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.90032154340836, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8000000000000002, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7567567567567568, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.11902488023042679, |
|
"eval_overall_accuracy": 0.9643549951503395, |
|
"eval_overall_f1": 0.84, |
|
"eval_overall_precision": 0.7816377171215881, |
|
"eval_overall_recall": 0.9077809798270894, |
|
"eval_runtime": 0.3269, |
|
"eval_samples_per_second": 572.066, |
|
"eval_steps_per_second": 9.178, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 1.2606264352798462, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.0917, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.7530864197530862, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6703296703296703, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7534246575342466, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6790123456790124, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13196653127670288, |
|
"eval_overall_accuracy": 0.9587778855480117, |
|
"eval_overall_f1": 0.8186666666666667, |
|
"eval_overall_precision": 0.7617866004962779, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3273, |
|
"eval_samples_per_second": 571.298, |
|
"eval_steps_per_second": 9.165, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 0.8119063973426819, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.0895, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.7625, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6853932584269663, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7755102040816327, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6951219512195121, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7466666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.12873846292495728, |
|
"eval_overall_accuracy": 0.9599903006789525, |
|
"eval_overall_f1": 0.8233731739707836, |
|
"eval_overall_precision": 0.7635467980295566, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3259, |
|
"eval_samples_per_second": 573.763, |
|
"eval_steps_per_second": 9.205, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 0.6412087082862854, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.0915, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.759493670886076, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7483870967741936, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6444444444444445, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7272727272727273, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6363636363636364, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.12941302359104156, |
|
"eval_overall_accuracy": 0.962172647914646, |
|
"eval_overall_f1": 0.8244680851063829, |
|
"eval_overall_precision": 0.7654320987654321, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3264, |
|
"eval_samples_per_second": 572.875, |
|
"eval_steps_per_second": 9.191, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 1.1233749389648438, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.0857, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.775, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6966292134831461, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7662337662337663, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6629213483146067, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.9067524115755627, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8757763975155279, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.6428571428571428, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5294117647058824, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.78125, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6944444444444444, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14580127596855164, |
|
"eval_overall_accuracy": 0.9553831231813773, |
|
"eval_overall_f1": 0.8124191461836998, |
|
"eval_overall_precision": 0.7370892018779343, |
|
"eval_overall_recall": 0.9048991354466859, |
|
"eval_runtime": 0.3274, |
|
"eval_samples_per_second": 571.119, |
|
"eval_steps_per_second": 9.162, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 2.415337085723877, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.0846, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.7837837837837838, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7532467532467533, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7763157894736842, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6781609195402298, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.9009584664536742, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8650306748466258, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.12516556680202484, |
|
"eval_overall_accuracy": 0.9636275460717749, |
|
"eval_overall_f1": 0.8337801608579088, |
|
"eval_overall_precision": 0.7794486215538847, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3273, |
|
"eval_samples_per_second": 571.332, |
|
"eval_steps_per_second": 9.166, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 0.36568284034729004, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.0828, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7361963190184049, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6122448979591837, |
|
"eval_ORGANIZATION_recall": 0.9230769230769231, |
|
"eval_PERSON_f1": 0.8974358974358974, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.12355955690145493, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8289473684210527, |
|
"eval_overall_precision": 0.7627118644067796, |
|
"eval_overall_recall": 0.9077809798270894, |
|
"eval_runtime": 0.3266, |
|
"eval_samples_per_second": 572.645, |
|
"eval_steps_per_second": 9.187, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 2.264235019683838, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.081, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7317073170731707, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6060606060606061, |
|
"eval_ORGANIZATION_recall": 0.9230769230769231, |
|
"eval_PERSON_f1": 0.8974358974358974, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13108646869659424, |
|
"eval_overall_accuracy": 0.9604752667313288, |
|
"eval_overall_f1": 0.8241469816272966, |
|
"eval_overall_precision": 0.7566265060240964, |
|
"eval_overall_recall": 0.9048991354466859, |
|
"eval_runtime": 0.3263, |
|
"eval_samples_per_second": 573.006, |
|
"eval_steps_per_second": 9.193, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.646797239780426, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.0782, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.7530864197530862, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6703296703296703, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7532467532467532, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.651685393258427, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8945686900958466, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7466666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13420291244983673, |
|
"eval_overall_accuracy": 0.9599903006789525, |
|
"eval_overall_f1": 0.8167539267015707, |
|
"eval_overall_precision": 0.7482014388489209, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.327, |
|
"eval_samples_per_second": 571.836, |
|
"eval_steps_per_second": 9.174, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 0.6615414023399353, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.0812, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.751592356687898, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.686046511627907, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7483870967741936, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6444444444444445, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8945686900958466, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.12814216315746307, |
|
"eval_overall_accuracy": 0.9604752667313288, |
|
"eval_overall_f1": 0.8174603174603176, |
|
"eval_overall_precision": 0.7555012224938875, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.327, |
|
"eval_samples_per_second": 571.795, |
|
"eval_steps_per_second": 9.173, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 1.0747178792953491, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.0759, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.7612903225806451, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7023809523809523, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.782051282051282, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6703296703296703, |
|
"eval_ORGANIZATION_recall": 0.9384615384615385, |
|
"eval_PERSON_f1": 0.8974358974358974, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.12921784818172455, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8269484808454426, |
|
"eval_overall_precision": 0.7634146341463415, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3274, |
|
"eval_samples_per_second": 571.082, |
|
"eval_steps_per_second": 9.162, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 0.9548816084861755, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.0755, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.7894736842105262, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7916666666666667, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7215189873417721, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7466666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.12423999607563019, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8279569892473119, |
|
"eval_overall_precision": 0.7758186397984886, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3276, |
|
"eval_samples_per_second": 570.793, |
|
"eval_steps_per_second": 9.157, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 0.42714256048202515, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.0739, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.751592356687898, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.686046511627907, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7453416149068324, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.625, |
|
"eval_ORGANIZATION_recall": 0.9230769230769231, |
|
"eval_PERSON_f1": 0.8974358974358974, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13675132393836975, |
|
"eval_overall_accuracy": 0.9568380213385063, |
|
"eval_overall_f1": 0.8141361256544503, |
|
"eval_overall_precision": 0.7458033573141487, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3266, |
|
"eval_samples_per_second": 572.553, |
|
"eval_steps_per_second": 9.185, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 1.520427942276001, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.0754, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.782051282051282, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7672955974842768, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.648936170212766, |
|
"eval_ORGANIZATION_recall": 0.9384615384615385, |
|
"eval_PERSON_f1": 0.90032154340836, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1319383829832077, |
|
"eval_overall_accuracy": 0.9595053346265762, |
|
"eval_overall_f1": 0.8289473684210527, |
|
"eval_overall_precision": 0.7627118644067796, |
|
"eval_overall_recall": 0.9077809798270894, |
|
"eval_runtime": 0.3273, |
|
"eval_samples_per_second": 571.333, |
|
"eval_steps_per_second": 9.166, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 0.7817038893699646, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.0703, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.7530864197530862, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6703296703296703, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7402597402597403, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6404494382022472, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8980891719745222, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8597560975609756, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7012987012987013, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1478222757577896, |
|
"eval_overall_accuracy": 0.9556256062075654, |
|
"eval_overall_f1": 0.8093994778067884, |
|
"eval_overall_precision": 0.7398568019093079, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3267, |
|
"eval_samples_per_second": 572.415, |
|
"eval_steps_per_second": 9.183, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 0.6990446448326111, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.0735, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.8181818181818181, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7516778523489933, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.879746835443038, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8373493975903614, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.806451612903226, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7352941176470589, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.12963485717773438, |
|
"eval_overall_accuracy": 0.9624151309408342, |
|
"eval_overall_f1": 0.8249336870026525, |
|
"eval_overall_precision": 0.7641277641277642, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.327, |
|
"eval_samples_per_second": 571.9, |
|
"eval_steps_per_second": 9.175, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 1.1196815967559814, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.0718, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.7402597402597403, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6867469879518072, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.7375, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6210526315789474, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.9038461538461539, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8703703703703703, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13455747067928314, |
|
"eval_overall_accuracy": 0.9595053346265762, |
|
"eval_overall_f1": 0.8190224570673712, |
|
"eval_overall_precision": 0.7560975609756098, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3273, |
|
"eval_samples_per_second": 571.347, |
|
"eval_steps_per_second": 9.166, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 0.904691219329834, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0694, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.7733333333333333, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7341772151898734, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7333333333333334, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6470588235294118, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8945686900958466, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7733333333333333, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6904761904761905, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.806451612903226, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7352941176470589, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1319706290960312, |
|
"eval_overall_accuracy": 0.9604752667313288, |
|
"eval_overall_f1": 0.8186666666666667, |
|
"eval_overall_precision": 0.7617866004962779, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3287, |
|
"eval_samples_per_second": 568.914, |
|
"eval_steps_per_second": 9.127, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 0.4921020567417145, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.0693, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.7435897435897436, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6823529411764706, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7515923566878981, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6413043478260869, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.912621359223301, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8867924528301887, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7733333333333333, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6904761904761905, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14422298967838287, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.8253968253968255, |
|
"eval_overall_precision": 0.7628361858190709, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3268, |
|
"eval_samples_per_second": 572.269, |
|
"eval_steps_per_second": 9.181, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 0.17059876024723053, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.0675, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.7763157894736843, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7283950617283951, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7866666666666665, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6941176470588235, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7466666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13859502971172333, |
|
"eval_overall_accuracy": 0.9595053346265762, |
|
"eval_overall_f1": 0.8266666666666667, |
|
"eval_overall_precision": 0.7692307692307693, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3267, |
|
"eval_samples_per_second": 572.428, |
|
"eval_steps_per_second": 9.183, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 0.5693849325180054, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.0672, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.7692307692307694, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7058823529411765, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7631578947368421, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8945686900958466, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.806451612903226, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7352941176470589, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13775749504566193, |
|
"eval_overall_accuracy": 0.9590203685741998, |
|
"eval_overall_f1": 0.8243064729194188, |
|
"eval_overall_precision": 0.7609756097560976, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.326, |
|
"eval_samples_per_second": 573.554, |
|
"eval_steps_per_second": 9.201, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 0.5870493650436401, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.067, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.7866666666666666, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7468354430379747, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7712418300653594, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6704545454545454, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8285714285714285, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7837837837837838, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13134053349494934, |
|
"eval_overall_accuracy": 0.9626576139670223, |
|
"eval_overall_f1": 0.8315508021390374, |
|
"eval_overall_precision": 0.7755610972568578, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.327, |
|
"eval_samples_per_second": 571.903, |
|
"eval_steps_per_second": 9.175, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 1.1741827726364136, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.0656, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7837837837837838, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6987951807228916, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8974358974358974, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13948975503444672, |
|
"eval_overall_accuracy": 0.9604752667313288, |
|
"eval_overall_f1": 0.8320000000000001, |
|
"eval_overall_precision": 0.7741935483870968, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3274, |
|
"eval_samples_per_second": 571.187, |
|
"eval_steps_per_second": 9.163, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 0.8152003288269043, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.0656, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.7662337662337662, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7108433734939759, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7450980392156863, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6477272727272727, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8945686900958466, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13262593746185303, |
|
"eval_overall_accuracy": 0.9604752667313288, |
|
"eval_overall_f1": 0.8222811671087533, |
|
"eval_overall_precision": 0.7616707616707616, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3275, |
|
"eval_samples_per_second": 571.056, |
|
"eval_steps_per_second": 9.161, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 0.9389750361442566, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.062, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.7421383647798742, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6704545454545454, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7450980392156863, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6477272727272727, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8924050632911392, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8493975903614458, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.806451612903226, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7352941176470589, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.15109694004058838, |
|
"eval_overall_accuracy": 0.9556256062075654, |
|
"eval_overall_f1": 0.81151832460733, |
|
"eval_overall_precision": 0.7434052757793765, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3278, |
|
"eval_samples_per_second": 570.556, |
|
"eval_steps_per_second": 9.153, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 1.3758347034454346, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.0638, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.7875000000000001, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7078651685393258, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7516778523489933, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7733333333333333, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6904761904761905, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1447124034166336, |
|
"eval_overall_accuracy": 0.9597478176527643, |
|
"eval_overall_f1": 0.8221343873517787, |
|
"eval_overall_precision": 0.7572815533980582, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.327, |
|
"eval_samples_per_second": 571.823, |
|
"eval_steps_per_second": 9.174, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 0.8612605333328247, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.0601, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.7792207792207793, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7228915662650602, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7567567567567568, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6746987951807228, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8974358974358974, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1353224217891693, |
|
"eval_overall_accuracy": 0.962172647914646, |
|
"eval_overall_f1": 0.8288770053475935, |
|
"eval_overall_precision": 0.773067331670823, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3281, |
|
"eval_samples_per_second": 569.939, |
|
"eval_steps_per_second": 9.143, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 1.3004350662231445, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0604, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.7792207792207793, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7228915662650602, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7549668874172185, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6627906976744186, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8974358974358974, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1338462084531784, |
|
"eval_overall_accuracy": 0.9619301648884578, |
|
"eval_overall_f1": 0.8315508021390374, |
|
"eval_overall_precision": 0.7755610972568578, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3278, |
|
"eval_samples_per_second": 570.522, |
|
"eval_steps_per_second": 9.153, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 0.871790885925293, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.0582, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.7654320987654322, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6813186813186813, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7619047619047619, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6829268292682927, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9096774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.88125, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13927897810935974, |
|
"eval_overall_accuracy": 0.9604752667313288, |
|
"eval_overall_f1": 0.8302387267904509, |
|
"eval_overall_precision": 0.769041769041769, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3272, |
|
"eval_samples_per_second": 571.49, |
|
"eval_steps_per_second": 9.168, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 0.7292200326919556, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0608, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.7631578947368421, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7160493827160493, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7295597484276729, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6170212765957447, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1517271101474762, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8153034300791556, |
|
"eval_overall_precision": 0.7518248175182481, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3279, |
|
"eval_samples_per_second": 570.258, |
|
"eval_steps_per_second": 9.149, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 0.8021668791770935, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.0575, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.7466666666666666, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7088607594936709, |
|
"eval_LOCATION_recall": 0.7887323943661971, |
|
"eval_ORGANIZATION_f1": 0.7361963190184049, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6122448979591837, |
|
"eval_ORGANIZATION_recall": 0.9230769230769231, |
|
"eval_PERSON_f1": 0.8832807570977917, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8383233532934131, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.15490397810935974, |
|
"eval_overall_accuracy": 0.9556256062075654, |
|
"eval_overall_f1": 0.8125819134993448, |
|
"eval_overall_precision": 0.7451923076923077, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3281, |
|
"eval_samples_per_second": 570.008, |
|
"eval_steps_per_second": 9.145, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 1.3401607275009155, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.0585, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.7402597402597403, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6867469879518072, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.7305389221556887, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5980392156862745, |
|
"eval_ORGANIZATION_recall": 0.9384615384615385, |
|
"eval_PERSON_f1": 0.8825396825396825, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.16088581085205078, |
|
"eval_overall_accuracy": 0.9541707080504365, |
|
"eval_overall_f1": 0.811443433029909, |
|
"eval_overall_precision": 0.7393364928909952, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3275, |
|
"eval_samples_per_second": 570.964, |
|
"eval_steps_per_second": 9.16, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 0.5186824202537537, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0571, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.782051282051282, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.75, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6551724137931034, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7733333333333333, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6904761904761905, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14577339589595795, |
|
"eval_overall_accuracy": 0.9599903006789525, |
|
"eval_overall_f1": 0.8282290279627165, |
|
"eval_overall_precision": 0.7698019801980198, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3267, |
|
"eval_samples_per_second": 572.313, |
|
"eval_steps_per_second": 9.181, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 1.0186669826507568, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.0574, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.7848101265822784, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7126436781609196, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7516778523489933, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.90032154340836, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14299847185611725, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8308921438082557, |
|
"eval_overall_precision": 0.7722772277227723, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3268, |
|
"eval_samples_per_second": 572.282, |
|
"eval_steps_per_second": 9.181, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 0.6867424845695496, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.0549, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.779874213836478, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7045454545454546, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7808219178082192, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7037037037037037, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8917197452229298, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8536585365853658, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14952713251113892, |
|
"eval_overall_accuracy": 0.9616876818622696, |
|
"eval_overall_f1": 0.8335552596537948, |
|
"eval_overall_precision": 0.7747524752475248, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3268, |
|
"eval_samples_per_second": 572.296, |
|
"eval_steps_per_second": 9.181, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 0.42461711168289185, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.0534, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.7692307692307694, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7058823529411765, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7702702702702702, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6867469879518072, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7733333333333333, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6904761904761905, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14496611058712006, |
|
"eval_overall_accuracy": 0.9595053346265762, |
|
"eval_overall_f1": 0.8262032085561497, |
|
"eval_overall_precision": 0.770573566084788, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.327, |
|
"eval_samples_per_second": 571.822, |
|
"eval_steps_per_second": 9.174, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 2.0102553367614746, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.0513, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.7532467532467533, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6987951807228916, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7692307692307692, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6593406593406593, |
|
"eval_ORGANIZATION_recall": 0.9230769230769231, |
|
"eval_PERSON_f1": 0.8945686900958466, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.912280701754386, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.896551724137931, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.147059828042984, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8302387267904509, |
|
"eval_overall_precision": 0.769041769041769, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3282, |
|
"eval_samples_per_second": 569.709, |
|
"eval_steps_per_second": 9.14, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 1.5348504781723022, |
|
"learning_rate": 2e-05, |
|
"loss": 0.0524, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.7631578947368421, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7160493827160493, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7712418300653594, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6704545454545454, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.888178913738019, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.852760736196319, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14413262903690338, |
|
"eval_overall_accuracy": 0.9599903006789525, |
|
"eval_overall_f1": 0.8273092369477911, |
|
"eval_overall_precision": 0.7725, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.327, |
|
"eval_samples_per_second": 571.842, |
|
"eval_steps_per_second": 9.174, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 1.0918995141983032, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.0523, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.7581699346405228, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7073170731707317, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7564102564102564, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6483516483516484, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8484848484848485, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15414579212665558, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.8222811671087533, |
|
"eval_overall_precision": 0.7616707616707616, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3259, |
|
"eval_samples_per_second": 573.773, |
|
"eval_steps_per_second": 9.205, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 0.9440881013870239, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.0531, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.7814569536423841, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7375, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7682119205298013, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6744186046511628, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15256355702877045, |
|
"eval_overall_accuracy": 0.9595053346265762, |
|
"eval_overall_f1": 0.8306451612903226, |
|
"eval_overall_precision": 0.7783375314861462, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.326, |
|
"eval_samples_per_second": 573.658, |
|
"eval_steps_per_second": 9.203, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 1.0544549226760864, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0495, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.7483870967741935, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6904761904761905, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7435897435897436, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6373626373626373, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1558208018541336, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8218085106382977, |
|
"eval_overall_precision": 0.762962962962963, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.327, |
|
"eval_samples_per_second": 571.805, |
|
"eval_steps_per_second": 9.173, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 0.0981023833155632, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0503, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.7792207792207793, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7228915662650602, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7733333333333334, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6823529411764706, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8974358974358974, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7733333333333333, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6904761904761905, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15108107030391693, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8293333333333333, |
|
"eval_overall_precision": 0.771712158808933, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3276, |
|
"eval_samples_per_second": 570.896, |
|
"eval_steps_per_second": 9.159, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 0.6967347264289856, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0517, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.7843137254901961, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7317073170731707, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7702702702702702, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6867469879518072, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14456935226917267, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8317631224764469, |
|
"eval_overall_precision": 0.7803030303030303, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3275, |
|
"eval_samples_per_second": 570.976, |
|
"eval_steps_per_second": 9.16, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 0.616130530834198, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.0493, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.7875000000000001, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7078651685393258, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7532467532467532, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.651685393258427, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7272727272727273, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6363636363636364, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16076360642910004, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8236842105263158, |
|
"eval_overall_precision": 0.7578692493946732, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3273, |
|
"eval_samples_per_second": 571.374, |
|
"eval_steps_per_second": 9.166, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 0.8930002450942993, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0508, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.7848101265822784, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7126436781609196, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7581699346405228, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6590909090909091, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.888178913738019, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.852760736196319, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7631578947368421, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6744186046511628, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1603231132030487, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8232189973614775, |
|
"eval_overall_precision": 0.7591240875912408, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3264, |
|
"eval_samples_per_second": 572.961, |
|
"eval_steps_per_second": 9.192, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 0.3851192891597748, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.0486, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.7612903225806451, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7023809523809523, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7631578947368421, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7733333333333333, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6904761904761905, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14870406687259674, |
|
"eval_overall_accuracy": 0.9595053346265762, |
|
"eval_overall_f1": 0.8213333333333332, |
|
"eval_overall_precision": 0.7642679900744417, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3249, |
|
"eval_samples_per_second": 575.524, |
|
"eval_steps_per_second": 9.233, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 0.668571949005127, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.0475, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7631578947368421, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8945686900958466, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15184400975704193, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8353413654618473, |
|
"eval_overall_precision": 0.78, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3285, |
|
"eval_samples_per_second": 569.263, |
|
"eval_steps_per_second": 9.133, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 1.2341712713241577, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.0491, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.8133333333333335, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7721518987341772, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7837837837837838, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6987951807228916, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14618448913097382, |
|
"eval_overall_accuracy": 0.9629000969932104, |
|
"eval_overall_f1": 0.8389715832205683, |
|
"eval_overall_precision": 0.7908163265306123, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3272, |
|
"eval_samples_per_second": 571.603, |
|
"eval_steps_per_second": 9.17, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 0.7431372404098511, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0462, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.7848101265822784, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7126436781609196, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7631578947368421, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.888178913738019, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.852760736196319, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7733333333333333, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6904761904761905, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1648775339126587, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8269484808454426, |
|
"eval_overall_precision": 0.7634146341463415, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3274, |
|
"eval_samples_per_second": 571.19, |
|
"eval_steps_per_second": 9.163, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 0.7144307494163513, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.046, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7712418300653594, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6704545454545454, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1596042811870575, |
|
"eval_overall_accuracy": 0.9604752667313288, |
|
"eval_overall_f1": 0.8308921438082557, |
|
"eval_overall_precision": 0.7722772277227723, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3254, |
|
"eval_samples_per_second": 574.71, |
|
"eval_steps_per_second": 9.22, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 0.5636935830116272, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0453, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7516778523489933, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1584891676902771, |
|
"eval_overall_accuracy": 0.9592628516003879, |
|
"eval_overall_f1": 0.8315508021390374, |
|
"eval_overall_precision": 0.7755610972568578, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3271, |
|
"eval_samples_per_second": 571.735, |
|
"eval_steps_per_second": 9.172, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 0.8465162515640259, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0467, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7516778523489933, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8996763754045306, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8742138364779874, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1548159122467041, |
|
"eval_overall_accuracy": 0.9604752667313288, |
|
"eval_overall_f1": 0.8322147651006712, |
|
"eval_overall_precision": 0.7788944723618091, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3278, |
|
"eval_samples_per_second": 570.444, |
|
"eval_steps_per_second": 9.152, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 1.0343018770217896, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0443, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.823529411764706, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7682926829268293, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7368421052631579, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6436781609195402, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9025974025974027, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.879746835443038, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15346647799015045, |
|
"eval_overall_accuracy": 0.9616876818622696, |
|
"eval_overall_f1": 0.8348993288590604, |
|
"eval_overall_precision": 0.7814070351758794, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3271, |
|
"eval_samples_per_second": 571.622, |
|
"eval_steps_per_second": 9.17, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 0.05382401496171951, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0447, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7814569536423841, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.686046511627907, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.9061488673139159, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8805031446540881, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.16000644862651825, |
|
"eval_overall_accuracy": 0.9619301648884578, |
|
"eval_overall_f1": 0.8467741935483871, |
|
"eval_overall_precision": 0.7934508816120907, |
|
"eval_overall_recall": 0.9077809798270894, |
|
"eval_runtime": 0.326, |
|
"eval_samples_per_second": 573.613, |
|
"eval_steps_per_second": 9.202, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 9.811291694641113, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.0441, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.7721518987341772, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7011494252873564, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7808219178082192, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.7037037037037037, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.8055555555555556, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7435897435897436, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15801285207271576, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8371467025572005, |
|
"eval_overall_precision": 0.7853535353535354, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.328, |
|
"eval_samples_per_second": 570.116, |
|
"eval_steps_per_second": 9.146, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 1.3943322896957397, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.0438, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.782051282051282, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7785234899328859, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6904761904761905, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15934574604034424, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8387096774193548, |
|
"eval_overall_precision": 0.7858942065491183, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3262, |
|
"eval_samples_per_second": 573.317, |
|
"eval_steps_per_second": 9.198, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 0.6321301460266113, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0449, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.7843137254901961, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7317073170731707, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7651006711409396, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6785714285714286, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15974144637584686, |
|
"eval_overall_accuracy": 0.960717749757517, |
|
"eval_overall_f1": 0.8367071524966262, |
|
"eval_overall_precision": 0.7868020304568528, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3286, |
|
"eval_samples_per_second": 569.091, |
|
"eval_steps_per_second": 9.13, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 0.5539495348930359, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0436, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7785234899328859, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6904761904761905, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9061488673139159, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8805031446540881, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16229036450386047, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8421052631578949, |
|
"eval_overall_precision": 0.7918781725888325, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3259, |
|
"eval_samples_per_second": 573.851, |
|
"eval_steps_per_second": 9.206, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 3.007709503173828, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0434, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7581699346405228, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6590909090909091, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1612003743648529, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.835781041388518, |
|
"eval_overall_precision": 0.7786069651741293, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3275, |
|
"eval_samples_per_second": 571.067, |
|
"eval_steps_per_second": 9.162, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 1.6446222066879272, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0428, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7586206896551724, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6875, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15457752346992493, |
|
"eval_overall_accuracy": 0.9616876818622696, |
|
"eval_overall_f1": 0.8401084010840109, |
|
"eval_overall_precision": 0.7928388746803069, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3262, |
|
"eval_samples_per_second": 573.188, |
|
"eval_steps_per_second": 9.196, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 0.6172337532043457, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.043, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.7792207792207793, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7228915662650602, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.76, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6705882352941176, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16485904157161713, |
|
"eval_overall_accuracy": 0.9590203685741998, |
|
"eval_overall_f1": 0.8344549125168236, |
|
"eval_overall_precision": 0.7828282828282829, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3271, |
|
"eval_samples_per_second": 571.666, |
|
"eval_steps_per_second": 9.171, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 0.48714974522590637, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0451, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7755102040816327, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6951219512195121, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15948227047920227, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8421052631578949, |
|
"eval_overall_precision": 0.7918781725888325, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3279, |
|
"eval_samples_per_second": 570.348, |
|
"eval_steps_per_second": 9.15, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 0.8867198824882507, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0444, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7682119205298013, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6744186046511628, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9061488673139159, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8805031446540881, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16462980210781097, |
|
"eval_overall_accuracy": 0.960717749757517, |
|
"eval_overall_f1": 0.8413978494623656, |
|
"eval_overall_precision": 0.7884130982367759, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3281, |
|
"eval_samples_per_second": 569.983, |
|
"eval_steps_per_second": 9.144, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 0.4750601649284363, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0406, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7702702702702702, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6867469879518072, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9096774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.88125, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15999138355255127, |
|
"eval_overall_accuracy": 0.9619301648884578, |
|
"eval_overall_f1": 0.8432432432432433, |
|
"eval_overall_precision": 0.7938931297709924, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3277, |
|
"eval_samples_per_second": 570.57, |
|
"eval_steps_per_second": 9.154, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 0.6775397658348083, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0415, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7785234899328859, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6904761904761905, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8974358974358974, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16279393434524536, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8413978494623656, |
|
"eval_overall_precision": 0.7884130982367759, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3261, |
|
"eval_samples_per_second": 573.372, |
|
"eval_steps_per_second": 9.198, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 0.4834389090538025, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0407, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7682119205298013, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6744186046511628, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9061488673139159, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8805031446540881, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1641407161951065, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8409703504043127, |
|
"eval_overall_precision": 0.789873417721519, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3268, |
|
"eval_samples_per_second": 572.15, |
|
"eval_steps_per_second": 9.179, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 3.0661368370056152, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0426, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7733333333333334, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6823529411764706, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9067524115755627, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8757763975155279, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1607460379600525, |
|
"eval_overall_accuracy": 0.962172647914646, |
|
"eval_overall_f1": 0.8413978494623656, |
|
"eval_overall_precision": 0.7884130982367759, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3275, |
|
"eval_samples_per_second": 571.022, |
|
"eval_steps_per_second": 9.161, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 0.5167478919029236, |
|
"learning_rate": 5e-06, |
|
"loss": 0.041, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7837837837837838, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6987951807228916, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16166909039020538, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8421052631578949, |
|
"eval_overall_precision": 0.7918781725888325, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3276, |
|
"eval_samples_per_second": 570.818, |
|
"eval_steps_per_second": 9.158, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 0.6979191303253174, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0406, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7631578947368421, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16465260088443756, |
|
"eval_overall_accuracy": 0.960717749757517, |
|
"eval_overall_f1": 0.8375838926174496, |
|
"eval_overall_precision": 0.7839195979899497, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3268, |
|
"eval_samples_per_second": 572.184, |
|
"eval_steps_per_second": 9.179, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 0.35358938574790955, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.0408, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.7894736842105262, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7702702702702702, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6867469879518072, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9067524115755627, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8757763975155279, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15703369677066803, |
|
"eval_overall_accuracy": 0.962172647914646, |
|
"eval_overall_f1": 0.8394062078272604, |
|
"eval_overall_precision": 0.7893401015228426, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3273, |
|
"eval_samples_per_second": 571.285, |
|
"eval_steps_per_second": 9.165, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 0.4786812365055084, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.0411, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7631578947368421, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9067524115755627, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8757763975155279, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1660545915365219, |
|
"eval_overall_accuracy": 0.960717749757517, |
|
"eval_overall_f1": 0.8380187416331996, |
|
"eval_overall_precision": 0.7825, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.328, |
|
"eval_samples_per_second": 570.159, |
|
"eval_steps_per_second": 9.147, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 0.8427369594573975, |
|
"learning_rate": 3e-06, |
|
"loss": 0.04, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7631578947368421, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16458158195018768, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8375838926174496, |
|
"eval_overall_precision": 0.7839195979899497, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.327, |
|
"eval_samples_per_second": 571.854, |
|
"eval_steps_per_second": 9.174, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 1.0689115524291992, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0372, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7631578947368421, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9067524115755627, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8757763975155279, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16513913869857788, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8380187416331996, |
|
"eval_overall_precision": 0.7825, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3273, |
|
"eval_samples_per_second": 571.379, |
|
"eval_steps_per_second": 9.167, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 0.6339386105537415, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0393, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7631578947368421, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8974358974358974, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1637803018093109, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8353413654618473, |
|
"eval_overall_precision": 0.78, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3261, |
|
"eval_samples_per_second": 573.445, |
|
"eval_steps_per_second": 9.2, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 0.6922338604927063, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.0396, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7631578947368421, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16408979892730713, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8375838926174496, |
|
"eval_overall_precision": 0.7839195979899497, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3277, |
|
"eval_samples_per_second": 570.597, |
|
"eval_steps_per_second": 9.154, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 1.161203384399414, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0385, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7631578947368421, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1643643081188202, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8375838926174496, |
|
"eval_overall_precision": 0.7839195979899497, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3284, |
|
"eval_samples_per_second": 569.344, |
|
"eval_steps_per_second": 9.134, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 0.5302362442016602, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.0382, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7631578947368421, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1647883802652359, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8375838926174496, |
|
"eval_overall_precision": 0.7839195979899497, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3268, |
|
"eval_samples_per_second": 572.201, |
|
"eval_steps_per_second": 9.18, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 0.16222168505191803, |
|
"learning_rate": 0.0, |
|
"loss": 0.0411, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7631578947368421, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.16485615074634552, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8375838926174496, |
|
"eval_overall_precision": 0.7839195979899497, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3263, |
|
"eval_samples_per_second": 573.127, |
|
"eval_steps_per_second": 9.195, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 10600, |
|
"total_flos": 5123217774191952.0, |
|
"train_loss": 0.08768324019773951, |
|
"train_runtime": 561.3026, |
|
"train_samples_per_second": 300.729, |
|
"train_steps_per_second": 18.885 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 10600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 5123217774191952.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|