|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 10600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 1.0955079793930054, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 0.9897, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.03508771929824561, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.16666666666666666, |
|
"eval_PERSON_recall": 0.0196078431372549, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.5791746973991394, |
|
"eval_overall_accuracy": 0.8382462224424078, |
|
"eval_overall_f1": 0.016172506738544475, |
|
"eval_overall_precision": 0.12, |
|
"eval_overall_recall": 0.008670520231213872, |
|
"eval_runtime": 0.9785, |
|
"eval_samples_per_second": 191.103, |
|
"eval_steps_per_second": 3.066, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 1.0362498760223389, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.4994, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.2391304347826087, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.4782608695652174, |
|
"eval_LOCATION_recall": 0.15942028985507245, |
|
"eval_ORGANIZATION_f1": 0.022727272727272728, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.037037037037037035, |
|
"eval_ORGANIZATION_recall": 0.01639344262295082, |
|
"eval_PERSON_f1": 0.6062176165803108, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.5021459227467812, |
|
"eval_PERSON_recall": 0.7647058823529411, |
|
"eval_QUANTITY_f1": 0.12000000000000002, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.16666666666666666, |
|
"eval_QUANTITY_recall": 0.09375, |
|
"eval_TIME_f1": 0.4848484848484849, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.45714285714285713, |
|
"eval_TIME_recall": 0.5161290322580645, |
|
"eval_loss": 0.3509860038757324, |
|
"eval_overall_accuracy": 0.8962100569729997, |
|
"eval_overall_f1": 0.43401759530791784, |
|
"eval_overall_precision": 0.44047619047619047, |
|
"eval_overall_recall": 0.4277456647398844, |
|
"eval_runtime": 1.0238, |
|
"eval_samples_per_second": 182.658, |
|
"eval_steps_per_second": 2.93, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 1.2612115144729614, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.3081, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.6883116883116883, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6235294117647059, |
|
"eval_LOCATION_recall": 0.7681159420289855, |
|
"eval_ORGANIZATION_f1": 0.39436619718309857, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.345679012345679, |
|
"eval_ORGANIZATION_recall": 0.45901639344262296, |
|
"eval_PERSON_f1": 0.8369230769230769, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.7906976744186046, |
|
"eval_PERSON_recall": 0.8888888888888888, |
|
"eval_QUANTITY_f1": 0.6111111111111112, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.55, |
|
"eval_QUANTITY_recall": 0.6875, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.20474210381507874, |
|
"eval_overall_accuracy": 0.9380728263562051, |
|
"eval_overall_f1": 0.6982872200263505, |
|
"eval_overall_precision": 0.6416464891041163, |
|
"eval_overall_recall": 0.7658959537572254, |
|
"eval_runtime": 1.0378, |
|
"eval_samples_per_second": 180.184, |
|
"eval_steps_per_second": 2.891, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 0.8938269019126892, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.2123, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.6826347305389221, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.5816326530612245, |
|
"eval_LOCATION_recall": 0.8260869565217391, |
|
"eval_ORGANIZATION_f1": 0.5801526717557252, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5428571428571428, |
|
"eval_ORGANIZATION_recall": 0.6229508196721312, |
|
"eval_PERSON_f1": 0.8562874251497005, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.7900552486187845, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.6046511627906976, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.48148148148148145, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.72, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.6136363636363636, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.18629486858844757, |
|
"eval_overall_accuracy": 0.9400544959128065, |
|
"eval_overall_f1": 0.7339218158890289, |
|
"eval_overall_precision": 0.6510067114093959, |
|
"eval_overall_recall": 0.8410404624277457, |
|
"eval_runtime": 0.994, |
|
"eval_samples_per_second": 188.123, |
|
"eval_steps_per_second": 3.018, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 1.1821776628494263, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.1737, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.7417218543046358, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6829268292682927, |
|
"eval_LOCATION_recall": 0.8115942028985508, |
|
"eval_ORGANIZATION_f1": 0.6474820143884893, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5769230769230769, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.8693009118541033, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8125, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.6478873239436619, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.5897435897435898, |
|
"eval_QUANTITY_recall": 0.71875, |
|
"eval_TIME_f1": 0.8615384615384616, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8235294117647058, |
|
"eval_TIME_recall": 0.9032258064516129, |
|
"eval_loss": 0.14358247816562653, |
|
"eval_overall_accuracy": 0.9524399306415655, |
|
"eval_overall_f1": 0.7814569536423841, |
|
"eval_overall_precision": 0.7212713936430318, |
|
"eval_overall_recall": 0.8526011560693642, |
|
"eval_runtime": 0.9687, |
|
"eval_samples_per_second": 193.04, |
|
"eval_steps_per_second": 3.097, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 0.5935459733009338, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.1547, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.7388535031847134, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6590909090909091, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.6666666666666667, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5617977528089888, |
|
"eval_ORGANIZATION_recall": 0.819672131147541, |
|
"eval_PERSON_f1": 0.8827160493827161, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8362573099415205, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.684931506849315, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.6097560975609756, |
|
"eval_QUANTITY_recall": 0.78125, |
|
"eval_TIME_f1": 0.7714285714285716, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.6923076923076923, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.143008753657341, |
|
"eval_overall_accuracy": 0.953183056725291, |
|
"eval_overall_f1": 0.7829457364341086, |
|
"eval_overall_precision": 0.7079439252336449, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 0.9772, |
|
"eval_samples_per_second": 191.367, |
|
"eval_steps_per_second": 3.07, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 0.4739581048488617, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.1434, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.7142857142857144, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6470588235294118, |
|
"eval_LOCATION_recall": 0.7971014492753623, |
|
"eval_ORGANIZATION_f1": 0.6715328467153285, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6052631578947368, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8800000000000001, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8313953488372093, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.6923076923076924, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.5869565217391305, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.8059701492537312, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.14124642312526703, |
|
"eval_overall_accuracy": 0.9529353480307159, |
|
"eval_overall_f1": 0.7831800262812089, |
|
"eval_overall_precision": 0.7180722891566265, |
|
"eval_overall_recall": 0.861271676300578, |
|
"eval_runtime": 0.998, |
|
"eval_samples_per_second": 187.368, |
|
"eval_steps_per_second": 3.006, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 0.6086934208869934, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.1316, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.778523489932886, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.725, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.6577181208053691, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5568181818181818, |
|
"eval_ORGANIZATION_recall": 0.8032786885245902, |
|
"eval_PERSON_f1": 0.89937106918239, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8666666666666667, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.6944444444444444, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.625, |
|
"eval_QUANTITY_recall": 0.78125, |
|
"eval_TIME_f1": 0.7323943661971831, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.65, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.13939833641052246, |
|
"eval_overall_accuracy": 0.9546693088927422, |
|
"eval_overall_f1": 0.7931488801054017, |
|
"eval_overall_precision": 0.7288135593220338, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 1.0022, |
|
"eval_samples_per_second": 186.59, |
|
"eval_steps_per_second": 2.993, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 1.063918113708496, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.1279, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.763157894736842, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6987951807228916, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.6518518518518518, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5945945945945946, |
|
"eval_ORGANIZATION_recall": 0.7213114754098361, |
|
"eval_PERSON_f1": 0.897196261682243, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.7397260273972602, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.7222222222222222, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.6341463414634146, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.13130132853984833, |
|
"eval_overall_accuracy": 0.9564032697547684, |
|
"eval_overall_f1": 0.7941567065073042, |
|
"eval_overall_precision": 0.7346437346437347, |
|
"eval_overall_recall": 0.8641618497109826, |
|
"eval_runtime": 1.0067, |
|
"eval_samples_per_second": 185.75, |
|
"eval_steps_per_second": 2.98, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 0.9094120860099792, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.1211, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.7702702702702703, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7215189873417721, |
|
"eval_LOCATION_recall": 0.8260869565217391, |
|
"eval_ORGANIZATION_f1": 0.6259541984732824, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5857142857142857, |
|
"eval_ORGANIZATION_recall": 0.6721311475409836, |
|
"eval_PERSON_f1": 0.9148264984227129, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8841463414634146, |
|
"eval_PERSON_recall": 0.9477124183006536, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7428571428571429, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8059701492537312, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.12145308405160904, |
|
"eval_overall_accuracy": 0.9616051523408472, |
|
"eval_overall_f1": 0.8109589041095892, |
|
"eval_overall_precision": 0.7708333333333334, |
|
"eval_overall_recall": 0.8554913294797688, |
|
"eval_runtime": 0.9852, |
|
"eval_samples_per_second": 189.802, |
|
"eval_steps_per_second": 3.045, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 0.7485252022743225, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.114, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.7549668874172186, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6951219512195121, |
|
"eval_LOCATION_recall": 0.8260869565217391, |
|
"eval_ORGANIZATION_f1": 0.6527777777777777, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5662650602409639, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.896551724137931, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8614457831325302, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7123287671232876, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.6341463414634146, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1312883496284485, |
|
"eval_overall_accuracy": 0.9571463958384939, |
|
"eval_overall_f1": 0.7941567065073042, |
|
"eval_overall_precision": 0.7346437346437347, |
|
"eval_overall_recall": 0.8641618497109826, |
|
"eval_runtime": 0.9834, |
|
"eval_samples_per_second": 190.157, |
|
"eval_steps_per_second": 3.051, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 1.104870080947876, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.1087, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.778523489932886, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.725, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.6969696969696969, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.647887323943662, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.9022082018927446, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8719512195121951, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7105263157894737, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.8307692307692308, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7941176470588235, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.13906444609165192, |
|
"eval_overall_accuracy": 0.9561555610601932, |
|
"eval_overall_f1": 0.8146143437077131, |
|
"eval_overall_precision": 0.7659033078880407, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.9902, |
|
"eval_samples_per_second": 188.851, |
|
"eval_steps_per_second": 3.03, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 0.6125289797782898, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.1042, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.8163265306122449, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7692307692307693, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6811594202898551, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6103896103896104, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.89937106918239, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8666666666666667, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7714285714285714, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7105263157894737, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.13031348586082458, |
|
"eval_overall_accuracy": 0.9606143175625464, |
|
"eval_overall_f1": 0.8211382113821138, |
|
"eval_overall_precision": 0.7729591836734694, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 0.9889, |
|
"eval_samples_per_second": 189.1, |
|
"eval_steps_per_second": 3.034, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 2.0589206218719482, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.1018, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.7945205479452054, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7532467532467533, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.6911764705882353, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6266666666666667, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.9056603773584905, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8727272727272727, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.7012987012987012, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.7428571428571428, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.14253932237625122, |
|
"eval_overall_accuracy": 0.9561555610601932, |
|
"eval_overall_f1": 0.8085676037483266, |
|
"eval_overall_precision": 0.7531172069825436, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 0.9977, |
|
"eval_samples_per_second": 187.428, |
|
"eval_steps_per_second": 3.007, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 0.1841476559638977, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.0973, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.7919463087248322, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7375, |
|
"eval_LOCATION_recall": 0.855072463768116, |
|
"eval_ORGANIZATION_f1": 0.6115702479338844, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6166666666666667, |
|
"eval_ORGANIZATION_recall": 0.6065573770491803, |
|
"eval_PERSON_f1": 0.8987341772151898, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8711656441717791, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.7826086956521738, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7297297297297297, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.875, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8484848484848485, |
|
"eval_TIME_recall": 0.9032258064516129, |
|
"eval_loss": 0.1355912983417511, |
|
"eval_overall_accuracy": 0.9581372306167947, |
|
"eval_overall_f1": 0.8150208623087621, |
|
"eval_overall_precision": 0.7855227882037533, |
|
"eval_overall_recall": 0.846820809248555, |
|
"eval_runtime": 0.9803, |
|
"eval_samples_per_second": 190.757, |
|
"eval_steps_per_second": 3.06, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 0.4039229452610016, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.0931, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.7549668874172186, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6951219512195121, |
|
"eval_LOCATION_recall": 0.8260869565217391, |
|
"eval_ORGANIZATION_f1": 0.6808510638297871, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.7868852459016393, |
|
"eval_PERSON_f1": 0.9028213166144202, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8674698795180723, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.7647058823529411, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.84375, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8181818181818182, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.1370057314634323, |
|
"eval_overall_accuracy": 0.9591280653950953, |
|
"eval_overall_f1": 0.8129205921938087, |
|
"eval_overall_precision": 0.760705289672544, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 1.0534, |
|
"eval_samples_per_second": 177.517, |
|
"eval_steps_per_second": 2.848, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 0.39411261677742004, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.0925, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.8026315789473685, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6621621621621622, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5632183908045977, |
|
"eval_ORGANIZATION_recall": 0.8032786885245902, |
|
"eval_PERSON_f1": 0.896551724137931, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8614457831325302, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7397260273972602, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.7428571428571428, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1501362919807434, |
|
"eval_overall_accuracy": 0.9529353480307159, |
|
"eval_overall_f1": 0.8031496062992126, |
|
"eval_overall_precision": 0.7355769230769231, |
|
"eval_overall_recall": 0.884393063583815, |
|
"eval_runtime": 0.9811, |
|
"eval_samples_per_second": 190.602, |
|
"eval_steps_per_second": 3.058, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 0.6146470308303833, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.0885, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.8299319727891156, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.782051282051282, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6451612903225806, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6349206349206349, |
|
"eval_ORGANIZATION_recall": 0.6557377049180327, |
|
"eval_PERSON_f1": 0.8987341772151898, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8711656441717791, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.742857142857143, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.6842105263157895, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.84375, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8181818181818182, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.12835608422756195, |
|
"eval_overall_accuracy": 0.9596234827842457, |
|
"eval_overall_f1": 0.8210818307905687, |
|
"eval_overall_precision": 0.7893333333333333, |
|
"eval_overall_recall": 0.8554913294797688, |
|
"eval_runtime": 0.9954, |
|
"eval_samples_per_second": 187.858, |
|
"eval_steps_per_second": 3.014, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 0.8693987131118774, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.088, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.8243243243243245, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7721518987341772, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6716417910447762, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6164383561643836, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.9022082018927446, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8719512195121951, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7323943661971831, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.84375, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8181818181818182, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.12790969014167786, |
|
"eval_overall_accuracy": 0.9621005697299975, |
|
"eval_overall_f1": 0.8228882833787465, |
|
"eval_overall_precision": 0.7783505154639175, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 1.0031, |
|
"eval_samples_per_second": 186.424, |
|
"eval_steps_per_second": 2.991, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 0.5405162572860718, |
|
"learning_rate": 4e-05, |
|
"loss": 0.0786, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.704225352112676, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6172839506172839, |
|
"eval_ORGANIZATION_recall": 0.819672131147541, |
|
"eval_PERSON_f1": 0.89937106918239, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8666666666666667, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7323943661971831, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7761194029850746, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7222222222222222, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1476246416568756, |
|
"eval_overall_accuracy": 0.9571463958384939, |
|
"eval_overall_f1": 0.8170894526034712, |
|
"eval_overall_precision": 0.7593052109181141, |
|
"eval_overall_recall": 0.884393063583815, |
|
"eval_runtime": 1.0147, |
|
"eval_samples_per_second": 184.289, |
|
"eval_steps_per_second": 2.957, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 0.5259639620780945, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.0776, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.7866666666666667, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7283950617283951, |
|
"eval_LOCATION_recall": 0.855072463768116, |
|
"eval_ORGANIZATION_f1": 0.6617647058823529, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.8944099378881987, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8520710059171598, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.742857142857143, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.6842105263157895, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8307692307692308, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7941176470588235, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.1557183563709259, |
|
"eval_overall_accuracy": 0.955907852365618, |
|
"eval_overall_f1": 0.8102288021534321, |
|
"eval_overall_precision": 0.7581863979848866, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.9938, |
|
"eval_samples_per_second": 188.167, |
|
"eval_steps_per_second": 3.019, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 0.4461101293563843, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.0789, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.7808219178082192, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7402597402597403, |
|
"eval_LOCATION_recall": 0.8260869565217391, |
|
"eval_ORGANIZATION_f1": 0.6086956521739131, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.49, |
|
"eval_ORGANIZATION_recall": 0.8032786885245902, |
|
"eval_PERSON_f1": 0.9022082018927446, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8719512195121951, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7428571428571429, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7761194029850746, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7222222222222222, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1589283049106598, |
|
"eval_overall_accuracy": 0.9497151350012385, |
|
"eval_overall_f1": 0.7941952506596306, |
|
"eval_overall_precision": 0.7305825242718447, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.993, |
|
"eval_samples_per_second": 188.313, |
|
"eval_steps_per_second": 3.021, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 1.1329030990600586, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.079, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.7702702702702703, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7215189873417721, |
|
"eval_LOCATION_recall": 0.8260869565217391, |
|
"eval_ORGANIZATION_f1": 0.6818181818181818, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6338028169014085, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.9113924050632911, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8834355828220859, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.7222222222222223, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.65, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.13774369657039642, |
|
"eval_overall_accuracy": 0.9593757740896706, |
|
"eval_overall_f1": 0.8119891008174387, |
|
"eval_overall_precision": 0.7680412371134021, |
|
"eval_overall_recall": 0.861271676300578, |
|
"eval_runtime": 0.98, |
|
"eval_samples_per_second": 190.819, |
|
"eval_steps_per_second": 3.061, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 1.0383950471878052, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.0728, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7631578947368421, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.6811594202898551, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6103896103896104, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.9085173501577287, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8780487804878049, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.8, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7878787878787878, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8181818181818182, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7714285714285715, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.13363541662693024, |
|
"eval_overall_accuracy": 0.9608620262571216, |
|
"eval_overall_f1": 0.8262653898768809, |
|
"eval_overall_precision": 0.7844155844155845, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 1.005, |
|
"eval_samples_per_second": 186.066, |
|
"eval_steps_per_second": 2.985, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 0.8166852593421936, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.071, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.7272727272727274, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6588235294117647, |
|
"eval_LOCATION_recall": 0.8115942028985508, |
|
"eval_ORGANIZATION_f1": 0.6623376623376623, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5483870967741935, |
|
"eval_ORGANIZATION_recall": 0.8360655737704918, |
|
"eval_PERSON_f1": 0.9028213166144202, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8674698795180723, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.7222222222222223, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.65, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7761194029850746, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7222222222222222, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.15092754364013672, |
|
"eval_overall_accuracy": 0.9539261828090166, |
|
"eval_overall_f1": 0.7911227154046997, |
|
"eval_overall_precision": 0.7214285714285714, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 0.9891, |
|
"eval_samples_per_second": 189.065, |
|
"eval_steps_per_second": 3.033, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 0.8139777183532715, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.072, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.7733333333333333, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7160493827160493, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.689655172413793, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5952380952380952, |
|
"eval_ORGANIZATION_recall": 0.819672131147541, |
|
"eval_PERSON_f1": 0.9113924050632911, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8834355828220859, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.6756756756756757, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.5952380952380952, |
|
"eval_QUANTITY_recall": 0.78125, |
|
"eval_TIME_f1": 0.7647058823529411, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7027027027027027, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1510118842124939, |
|
"eval_overall_accuracy": 0.9549170175873173, |
|
"eval_overall_f1": 0.804780876494024, |
|
"eval_overall_precision": 0.7444717444717445, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 0.9975, |
|
"eval_samples_per_second": 187.468, |
|
"eval_steps_per_second": 3.008, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 0.325568825006485, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.068, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.7837837837837838, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7341772151898734, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.6814814814814815, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6216216216216216, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.896551724137931, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8614457831325302, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7536231884057971, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8059701492537312, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.14145956933498383, |
|
"eval_overall_accuracy": 0.958632648005945, |
|
"eval_overall_f1": 0.8130081300813009, |
|
"eval_overall_precision": 0.7653061224489796, |
|
"eval_overall_recall": 0.8670520231213873, |
|
"eval_runtime": 0.9961, |
|
"eval_samples_per_second": 187.728, |
|
"eval_steps_per_second": 3.012, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 0.9541507363319397, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.0668, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.7755102040816326, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7307692307692307, |
|
"eval_LOCATION_recall": 0.8260869565217391, |
|
"eval_ORGANIZATION_f1": 0.6818181818181818, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6338028169014085, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.9085173501577287, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8780487804878049, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.7647058823529411, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7536231884057972, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.6842105263157895, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1411270946264267, |
|
"eval_overall_accuracy": 0.9598711914788209, |
|
"eval_overall_f1": 0.8130968622100955, |
|
"eval_overall_precision": 0.7700258397932817, |
|
"eval_overall_recall": 0.861271676300578, |
|
"eval_runtime": 0.9842, |
|
"eval_samples_per_second": 190.009, |
|
"eval_steps_per_second": 3.048, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 0.8704339265823364, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.0675, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6944444444444445, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6024096385542169, |
|
"eval_ORGANIZATION_recall": 0.819672131147541, |
|
"eval_PERSON_f1": 0.9022082018927446, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8719512195121951, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7428571428571429, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8064516129032258, |
|
"eval_loss": 0.14205148816108704, |
|
"eval_overall_accuracy": 0.9608620262571216, |
|
"eval_overall_f1": 0.8243243243243245, |
|
"eval_overall_precision": 0.7741116751269036, |
|
"eval_overall_recall": 0.8815028901734104, |
|
"eval_runtime": 1.078, |
|
"eval_samples_per_second": 173.471, |
|
"eval_steps_per_second": 2.783, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 0.5594027042388916, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.065, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.7581699346405228, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6904761904761905, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.6666666666666666, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5974025974025974, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.9, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8622754491017964, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.742857142857143, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.6842105263157895, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1492728590965271, |
|
"eval_overall_accuracy": 0.9583849393113698, |
|
"eval_overall_f1": 0.804289544235925, |
|
"eval_overall_precision": 0.75, |
|
"eval_overall_recall": 0.8670520231213873, |
|
"eval_runtime": 0.9945, |
|
"eval_samples_per_second": 188.028, |
|
"eval_steps_per_second": 3.016, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.3202365040779114, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.0649, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.7837837837837838, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7341772151898734, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.6865671641791045, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6301369863013698, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.9044585987261147, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8819875776397516, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7428571428571429, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.84375, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8181818181818182, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.1405114084482193, |
|
"eval_overall_accuracy": 0.9611097349516968, |
|
"eval_overall_f1": 0.8225584594222832, |
|
"eval_overall_precision": 0.7847769028871391, |
|
"eval_overall_recall": 0.8641618497109826, |
|
"eval_runtime": 0.9891, |
|
"eval_samples_per_second": 189.058, |
|
"eval_steps_per_second": 3.033, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 0.534267783164978, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.0602, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.8187919463087248, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6865671641791045, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6301369863013698, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8958990536277602, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8658536585365854, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7428571428571429, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.875, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8484848484848485, |
|
"eval_TIME_recall": 0.9032258064516129, |
|
"eval_loss": 0.13280674815177917, |
|
"eval_overall_accuracy": 0.9628436958137231, |
|
"eval_overall_f1": 0.8290013679890561, |
|
"eval_overall_precision": 0.787012987012987, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 0.9944, |
|
"eval_samples_per_second": 188.059, |
|
"eval_steps_per_second": 3.017, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 0.28801554441452026, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.0617, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.7891156462585034, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7435897435897436, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.6818181818181818, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6338028169014085, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.9015873015873016, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8765432098765432, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7428571428571429, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1359180212020874, |
|
"eval_overall_accuracy": 0.9603666088679713, |
|
"eval_overall_f1": 0.8170563961485556, |
|
"eval_overall_precision": 0.7795275590551181, |
|
"eval_overall_recall": 0.8583815028901735, |
|
"eval_runtime": 0.9982, |
|
"eval_samples_per_second": 187.341, |
|
"eval_steps_per_second": 3.005, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 0.6007792949676514, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.0592, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.7483870967741935, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6744186046511628, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.6754966887417219, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5666666666666667, |
|
"eval_ORGANIZATION_recall": 0.8360655737704918, |
|
"eval_PERSON_f1": 0.9125, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.874251497005988, |
|
"eval_PERSON_recall": 0.954248366013072, |
|
"eval_QUANTITY_f1": 0.6933333333333334, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.6046511627906976, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7222222222222222, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.6341463414634146, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.17786887288093567, |
|
"eval_overall_accuracy": 0.9512013871686896, |
|
"eval_overall_f1": 0.794307891332471, |
|
"eval_overall_precision": 0.7189695550351288, |
|
"eval_overall_recall": 0.8872832369942196, |
|
"eval_runtime": 1.0067, |
|
"eval_samples_per_second": 185.754, |
|
"eval_steps_per_second": 2.98, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 1.0059374570846558, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.0572, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.7866666666666667, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7283950617283951, |
|
"eval_LOCATION_recall": 0.855072463768116, |
|
"eval_ORGANIZATION_f1": 0.6762589928057554, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6025641025641025, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.8980891719745223, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8757763975155279, |
|
"eval_PERSON_recall": 0.9215686274509803, |
|
"eval_QUANTITY_f1": 0.7647058823529411, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8387096774193549, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.14642970263957977, |
|
"eval_overall_accuracy": 0.9591280653950953, |
|
"eval_overall_f1": 0.815825375170532, |
|
"eval_overall_precision": 0.772609819121447, |
|
"eval_overall_recall": 0.8641618497109826, |
|
"eval_runtime": 0.9961, |
|
"eval_samples_per_second": 187.738, |
|
"eval_steps_per_second": 3.012, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 0.9360735416412354, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.0569, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.7972972972972974, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7468354430379747, |
|
"eval_LOCATION_recall": 0.855072463768116, |
|
"eval_ORGANIZATION_f1": 0.6618705035971222, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5897435897435898, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.9211356466876972, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8902439024390244, |
|
"eval_PERSON_recall": 0.954248366013072, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8387096774193549, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.14345212280750275, |
|
"eval_overall_accuracy": 0.9618528610354223, |
|
"eval_overall_f1": 0.8278688524590163, |
|
"eval_overall_precision": 0.7849740932642487, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 1.0012, |
|
"eval_samples_per_second": 186.767, |
|
"eval_steps_per_second": 2.996, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 1.6939655542373657, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.0573, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.8163265306122449, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7692307692307693, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6715328467153285, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6052631578947368, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8958990536277602, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8658536585365854, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8524590163934426, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.14684607088565826, |
|
"eval_overall_accuracy": 0.9601189001733961, |
|
"eval_overall_f1": 0.8241758241758242, |
|
"eval_overall_precision": 0.7853403141361257, |
|
"eval_overall_recall": 0.8670520231213873, |
|
"eval_runtime": 0.9892, |
|
"eval_samples_per_second": 189.05, |
|
"eval_steps_per_second": 3.033, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 0.7411573529243469, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.0524, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.7866666666666667, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7283950617283951, |
|
"eval_LOCATION_recall": 0.855072463768116, |
|
"eval_ORGANIZATION_f1": 0.6714285714285714, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5949367088607594, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.89375, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8562874251497006, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7323943661971831, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.15702801942825317, |
|
"eval_overall_accuracy": 0.9576418132276443, |
|
"eval_overall_f1": 0.8058902275769746, |
|
"eval_overall_precision": 0.7506234413965087, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.9832, |
|
"eval_samples_per_second": 190.205, |
|
"eval_steps_per_second": 3.051, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 0.9962830543518066, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.0526, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.7947019867549668, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7317073170731707, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.7014925373134328, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6438356164383562, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.9119496855345912, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8787878787878788, |
|
"eval_PERSON_recall": 0.9477124183006536, |
|
"eval_QUANTITY_f1": 0.7536231884057971, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.84375, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.14492842555046082, |
|
"eval_overall_accuracy": 0.9623482784245727, |
|
"eval_overall_f1": 0.8299319727891157, |
|
"eval_overall_precision": 0.7840616966580977, |
|
"eval_overall_recall": 0.8815028901734104, |
|
"eval_runtime": 0.9833, |
|
"eval_samples_per_second": 190.175, |
|
"eval_steps_per_second": 3.051, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 0.8109886050224304, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0525, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.778523489932886, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.725, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.6814814814814815, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6216216216216216, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.9050632911392406, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8773006134969326, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7941176470588235, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.8181818181818182, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7714285714285715, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.15133674442768097, |
|
"eval_overall_accuracy": 0.9603666088679713, |
|
"eval_overall_f1": 0.8201634877384196, |
|
"eval_overall_precision": 0.7757731958762887, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.9893, |
|
"eval_samples_per_second": 189.014, |
|
"eval_steps_per_second": 3.032, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 0.10324083268642426, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.0511, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.7843137254901961, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7142857142857143, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6666666666666667, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6081081081081081, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.909657320872274, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8690476190476191, |
|
"eval_PERSON_recall": 0.954248366013072, |
|
"eval_QUANTITY_f1": 0.7647058823529411, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.157461017370224, |
|
"eval_overall_accuracy": 0.9588803567005202, |
|
"eval_overall_f1": 0.8167115902964959, |
|
"eval_overall_precision": 0.7651515151515151, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 0.9754, |
|
"eval_samples_per_second": 191.721, |
|
"eval_steps_per_second": 3.076, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 1.2128788232803345, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.0528, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.7733333333333333, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7160493827160493, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.6619718309859155, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5802469135802469, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.915360501567398, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8795180722891566, |
|
"eval_PERSON_recall": 0.954248366013072, |
|
"eval_QUANTITY_f1": 0.7536231884057971, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.84375, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8181818181818182, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.1547376662492752, |
|
"eval_overall_accuracy": 0.9593757740896706, |
|
"eval_overall_f1": 0.8172043010752688, |
|
"eval_overall_precision": 0.7638190954773869, |
|
"eval_overall_recall": 0.8786127167630058, |
|
"eval_runtime": 1.0757, |
|
"eval_samples_per_second": 173.839, |
|
"eval_steps_per_second": 2.789, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 0.1244686096906662, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.0499, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.7837837837837838, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7341772151898734, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.7014925373134328, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6438356164383562, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.8987341772151898, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8711656441717791, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.742857142857143, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.6842105263157895, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8253968253968254, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.15334224700927734, |
|
"eval_overall_accuracy": 0.9588803567005202, |
|
"eval_overall_f1": 0.8180574555403556, |
|
"eval_overall_precision": 0.7766233766233767, |
|
"eval_overall_recall": 0.8641618497109826, |
|
"eval_runtime": 1.1556, |
|
"eval_samples_per_second": 161.821, |
|
"eval_steps_per_second": 2.596, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 1.083632230758667, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.0471, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6917293233082706, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6388888888888888, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.9028213166144202, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8674698795180723, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.7647058823529411, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7761194029850746, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7222222222222222, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1608462631702423, |
|
"eval_overall_accuracy": 0.9591280653950953, |
|
"eval_overall_f1": 0.8211382113821138, |
|
"eval_overall_precision": 0.7729591836734694, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 1.0042, |
|
"eval_samples_per_second": 186.211, |
|
"eval_steps_per_second": 2.987, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 0.6506208181381226, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.0459, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.8053691275167786, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6865671641791045, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6301369863013698, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8819875776397514, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8402366863905325, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.742857142857143, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.6842105263157895, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.15545788407325745, |
|
"eval_overall_accuracy": 0.9581372306167947, |
|
"eval_overall_f1": 0.8097165991902835, |
|
"eval_overall_precision": 0.759493670886076, |
|
"eval_overall_recall": 0.8670520231213873, |
|
"eval_runtime": 0.9925, |
|
"eval_samples_per_second": 188.407, |
|
"eval_steps_per_second": 3.023, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 0.6165773272514343, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.0459, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.7549668874172186, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6951219512195121, |
|
"eval_LOCATION_recall": 0.8260869565217391, |
|
"eval_ORGANIZATION_f1": 0.6616541353383459, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6111111111111112, |
|
"eval_ORGANIZATION_recall": 0.7213114754098361, |
|
"eval_PERSON_f1": 0.8902821316614421, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8554216867469879, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.7536231884057971, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8253968253968254, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.166278675198555, |
|
"eval_overall_accuracy": 0.9571463958384939, |
|
"eval_overall_f1": 0.8027210884353743, |
|
"eval_overall_precision": 0.7583547557840618, |
|
"eval_overall_recall": 0.8526011560693642, |
|
"eval_runtime": 0.9964, |
|
"eval_samples_per_second": 187.678, |
|
"eval_steps_per_second": 3.011, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 1.6443135738372803, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.0457, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.8053691275167786, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.671875, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6417910447761194, |
|
"eval_ORGANIZATION_recall": 0.7049180327868853, |
|
"eval_PERSON_f1": 0.8847352024922119, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8452380952380952, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.9180327868852459, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.9333333333333333, |
|
"eval_TIME_recall": 0.9032258064516129, |
|
"eval_loss": 0.15434302389621735, |
|
"eval_overall_accuracy": 0.9628436958137231, |
|
"eval_overall_f1": 0.8248275862068966, |
|
"eval_overall_precision": 0.7889182058047494, |
|
"eval_overall_recall": 0.8641618497109826, |
|
"eval_runtime": 1.0099, |
|
"eval_samples_per_second": 185.163, |
|
"eval_steps_per_second": 2.971, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 0.7369825839996338, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.0442, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.7682119205298014, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7073170731707317, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.6769230769230768, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6376811594202898, |
|
"eval_ORGANIZATION_recall": 0.7213114754098361, |
|
"eval_PERSON_f1": 0.9050632911392406, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8773006134969326, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7647058823529411, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.15800130367279053, |
|
"eval_overall_accuracy": 0.9598711914788209, |
|
"eval_overall_f1": 0.8125854993160055, |
|
"eval_overall_precision": 0.7714285714285715, |
|
"eval_overall_recall": 0.8583815028901735, |
|
"eval_runtime": 0.9849, |
|
"eval_samples_per_second": 189.872, |
|
"eval_steps_per_second": 3.046, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 0.5814737677574158, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.0444, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.778523489932886, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.725, |
|
"eval_LOCATION_recall": 0.8405797101449275, |
|
"eval_ORGANIZATION_f1": 0.6962962962962963, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6351351351351351, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.9085173501577287, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8780487804878049, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8125, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7878787878787878, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.15717627108097076, |
|
"eval_overall_accuracy": 0.9621005697299975, |
|
"eval_overall_f1": 0.8235294117647058, |
|
"eval_overall_precision": 0.7818181818181819, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.993, |
|
"eval_samples_per_second": 188.327, |
|
"eval_steps_per_second": 3.021, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 0.585141658782959, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0424, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.8108108108108109, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.759493670886076, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6769230769230768, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6376811594202898, |
|
"eval_ORGANIZATION_recall": 0.7213114754098361, |
|
"eval_PERSON_f1": 0.8958990536277602, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8658536585365854, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8253968253968254, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.15228819847106934, |
|
"eval_overall_accuracy": 0.9621005697299975, |
|
"eval_overall_f1": 0.8232044198895027, |
|
"eval_overall_precision": 0.7883597883597884, |
|
"eval_overall_recall": 0.861271676300578, |
|
"eval_runtime": 0.9899, |
|
"eval_samples_per_second": 188.901, |
|
"eval_steps_per_second": 3.031, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 0.8279469013214111, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.0411, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.8053691275167786, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6714285714285714, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5949367088607594, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.897196261682243, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.84375, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8181818181818182, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.15568019449710846, |
|
"eval_overall_accuracy": 0.9616051523408472, |
|
"eval_overall_f1": 0.8216216216216216, |
|
"eval_overall_precision": 0.7715736040609137, |
|
"eval_overall_recall": 0.8786127167630058, |
|
"eval_runtime": 0.9971, |
|
"eval_samples_per_second": 187.536, |
|
"eval_steps_per_second": 3.009, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 0.46233218908309937, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0424, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6811594202898551, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6103896103896104, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.9028213166144202, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8674698795180723, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7428571428571429, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.15841934084892273, |
|
"eval_overall_accuracy": 0.9616051523408472, |
|
"eval_overall_f1": 0.8227334235453315, |
|
"eval_overall_precision": 0.7735368956743003, |
|
"eval_overall_recall": 0.8786127167630058, |
|
"eval_runtime": 0.992, |
|
"eval_samples_per_second": 188.511, |
|
"eval_steps_per_second": 3.024, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 0.6373240351676941, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.0408, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.8108108108108109, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.759493670886076, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6861313868613139, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.618421052631579, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.896551724137931, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8614457831325302, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7428571428571429, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8852459016393444, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.9, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.15928535163402557, |
|
"eval_overall_accuracy": 0.9618528610354223, |
|
"eval_overall_f1": 0.8278688524590163, |
|
"eval_overall_precision": 0.7849740932642487, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 0.989, |
|
"eval_samples_per_second": 189.088, |
|
"eval_steps_per_second": 3.034, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 0.2755186855792999, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.0412, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.8053691275167786, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6962962962962963, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6351351351351351, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.896551724137931, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8614457831325302, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8253968253968254, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.158822163939476, |
|
"eval_overall_accuracy": 0.9630914045082982, |
|
"eval_overall_f1": 0.825136612021858, |
|
"eval_overall_precision": 0.7823834196891192, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 0.9914, |
|
"eval_samples_per_second": 188.631, |
|
"eval_steps_per_second": 3.026, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 2.969045639038086, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0422, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.7999999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6301369863013699, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5411764705882353, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8958990536277602, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8658536585365854, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8181818181818182, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7714285714285715, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.1669679880142212, |
|
"eval_overall_accuracy": 0.9596234827842457, |
|
"eval_overall_f1": 0.8080536912751678, |
|
"eval_overall_precision": 0.7543859649122807, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 1.0094, |
|
"eval_samples_per_second": 185.251, |
|
"eval_steps_per_second": 2.972, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 1.2709088325500488, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.0393, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.821917808219178, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7792207792207793, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6917293233082706, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6388888888888888, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.9022082018927446, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8719512195121951, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8064516129032258, |
|
"eval_loss": 0.15802454948425293, |
|
"eval_overall_accuracy": 0.9630914045082982, |
|
"eval_overall_f1": 0.8310249307479224, |
|
"eval_overall_precision": 0.7978723404255319, |
|
"eval_overall_recall": 0.8670520231213873, |
|
"eval_runtime": 1.001, |
|
"eval_samples_per_second": 186.82, |
|
"eval_steps_per_second": 2.997, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 0.5410558581352234, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.0397, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6616541353383459, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6111111111111112, |
|
"eval_ORGANIZATION_recall": 0.7213114754098361, |
|
"eval_PERSON_f1": 0.9085173501577287, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8780487804878049, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8307692307692308, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7941176470588235, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.16334755718708038, |
|
"eval_overall_accuracy": 0.9625959871191478, |
|
"eval_overall_f1": 0.8262653898768809, |
|
"eval_overall_precision": 0.7844155844155845, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 1.0636, |
|
"eval_samples_per_second": 175.822, |
|
"eval_steps_per_second": 2.821, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 0.09321507066488266, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.0367, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6716417910447762, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6164383561643836, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.89937106918239, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8666666666666667, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8125, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7878787878787878, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.17088571190834045, |
|
"eval_overall_accuracy": 0.9608620262571216, |
|
"eval_overall_f1": 0.8212824010914053, |
|
"eval_overall_precision": 0.7777777777777778, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.9854, |
|
"eval_samples_per_second": 189.767, |
|
"eval_steps_per_second": 3.044, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 0.659205973148346, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.0384, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6376811594202898, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5714285714285714, |
|
"eval_ORGANIZATION_recall": 0.7213114754098361, |
|
"eval_PERSON_f1": 0.8987341772151898, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8711656441717791, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.7941176470588235, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.8059701492537312, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.17435206472873688, |
|
"eval_overall_accuracy": 0.9591280653950953, |
|
"eval_overall_f1": 0.8135135135135134, |
|
"eval_overall_precision": 0.7639593908629442, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.9909, |
|
"eval_samples_per_second": 188.725, |
|
"eval_steps_per_second": 3.028, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 0.5503810048103333, |
|
"learning_rate": 2e-05, |
|
"loss": 0.0383, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.7814569536423841, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7195121951219512, |
|
"eval_LOCATION_recall": 0.855072463768116, |
|
"eval_ORGANIZATION_f1": 0.6617647058823529, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.9, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8622754491017964, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7428571428571429, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8253968253968254, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1732153296470642, |
|
"eval_overall_accuracy": 0.9588803567005202, |
|
"eval_overall_f1": 0.814111261872456, |
|
"eval_overall_precision": 0.7672634271099744, |
|
"eval_overall_recall": 0.8670520231213873, |
|
"eval_runtime": 0.9921, |
|
"eval_samples_per_second": 188.484, |
|
"eval_steps_per_second": 3.024, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 1.4769850969314575, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.0336, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.8163265306122449, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7692307692307693, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6917293233082706, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6388888888888888, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8958990536277602, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8658536585365854, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.8181818181818182, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7941176470588235, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.8307692307692308, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7941176470588235, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.1649622768163681, |
|
"eval_overall_accuracy": 0.9633391132028735, |
|
"eval_overall_f1": 0.8296703296703297, |
|
"eval_overall_precision": 0.7905759162303665, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 0.9878, |
|
"eval_samples_per_second": 189.311, |
|
"eval_steps_per_second": 3.037, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 0.4070124328136444, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.0356, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.8026315789473685, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6521739130434783, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5844155844155844, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.897196261682243, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.7826086956521738, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7297297297297297, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.18611405789852142, |
|
"eval_overall_accuracy": 0.9568986871439188, |
|
"eval_overall_f1": 0.8123324396782842, |
|
"eval_overall_precision": 0.7575, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 1.0068, |
|
"eval_samples_per_second": 185.733, |
|
"eval_steps_per_second": 2.98, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 0.3907913863658905, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0344, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.8108108108108109, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.759493670886076, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6917293233082706, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6388888888888888, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.9022082018927446, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8719512195121951, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1645907610654831, |
|
"eval_overall_accuracy": 0.9608620262571216, |
|
"eval_overall_f1": 0.8257887517146777, |
|
"eval_overall_precision": 0.7859007832898173, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.9932, |
|
"eval_samples_per_second": 188.281, |
|
"eval_steps_per_second": 3.021, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 0.682833731174469, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0333, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.8053691275167786, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6713286713286712, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5853658536585366, |
|
"eval_ORGANIZATION_recall": 0.7868852459016393, |
|
"eval_PERSON_f1": 0.9028213166144202, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8674698795180723, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7761194029850746, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7222222222222222, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.17704235017299652, |
|
"eval_overall_accuracy": 0.9593757740896706, |
|
"eval_overall_f1": 0.8172043010752688, |
|
"eval_overall_precision": 0.7638190954773869, |
|
"eval_overall_recall": 0.8786127167630058, |
|
"eval_runtime": 1.0021, |
|
"eval_samples_per_second": 186.614, |
|
"eval_steps_per_second": 2.994, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 0.3721832036972046, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0342, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6618705035971222, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5897435897435898, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.9050632911392406, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8773006134969326, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.8059701492537314, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7714285714285715, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1735246777534485, |
|
"eval_overall_accuracy": 0.9601189001733961, |
|
"eval_overall_f1": 0.8222523744911805, |
|
"eval_overall_precision": 0.7749360613810742, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 1.0031, |
|
"eval_samples_per_second": 186.413, |
|
"eval_steps_per_second": 2.991, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 0.2796691954135895, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.0341, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6617647058823529, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.9, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8622754491017964, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.8059701492537314, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7714285714285715, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.7647058823529411, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7027027027027027, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1770649254322052, |
|
"eval_overall_accuracy": 0.9606143175625464, |
|
"eval_overall_f1": 0.8178137651821862, |
|
"eval_overall_precision": 0.7670886075949367, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 0.9965, |
|
"eval_samples_per_second": 187.651, |
|
"eval_steps_per_second": 3.01, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 0.8784322142601013, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0326, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.8053691275167786, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6666666666666666, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5974025974025974, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8930817610062893, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8606060606060606, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.8059701492537314, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7714285714285715, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1722780466079712, |
|
"eval_overall_accuracy": 0.9593757740896706, |
|
"eval_overall_f1": 0.8157181571815717, |
|
"eval_overall_precision": 0.7678571428571429, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 1.0013, |
|
"eval_samples_per_second": 186.756, |
|
"eval_steps_per_second": 2.996, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 0.47935327887535095, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.0347, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.7999999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.656934306569343, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5921052631578947, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.9056603773584905, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8727272727272727, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.7941176470588235, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.7761194029850746, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7222222222222222, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.18066948652267456, |
|
"eval_overall_accuracy": 0.9583849393113698, |
|
"eval_overall_f1": 0.8162162162162162, |
|
"eval_overall_precision": 0.766497461928934, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 0.9981, |
|
"eval_samples_per_second": 187.358, |
|
"eval_steps_per_second": 3.006, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 0.7104108333587646, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.033, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.7919463087248322, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7375, |
|
"eval_LOCATION_recall": 0.855072463768116, |
|
"eval_ORGANIZATION_f1": 0.6666666666666666, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.5875, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.9028213166144202, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8674698795180723, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1800457388162613, |
|
"eval_overall_accuracy": 0.9583849393113698, |
|
"eval_overall_f1": 0.8162162162162162, |
|
"eval_overall_precision": 0.766497461928934, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 1.0133, |
|
"eval_samples_per_second": 184.537, |
|
"eval_steps_per_second": 2.96, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 1.264423131942749, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.032, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.7999999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6716417910447762, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6164383561643836, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.9056603773584905, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8727272727272727, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.8181818181818182, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7941176470588235, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1743316799402237, |
|
"eval_overall_accuracy": 0.9611097349516968, |
|
"eval_overall_f1": 0.8240109140518418, |
|
"eval_overall_precision": 0.7803617571059431, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 0.9948, |
|
"eval_samples_per_second": 187.983, |
|
"eval_steps_per_second": 3.016, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 0.542935848236084, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0324, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.7947019867549668, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7317073170731707, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6715328467153285, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6052631578947368, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8958990536277602, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8658536585365854, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.8181818181818182, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7941176470588235, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.8125, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7878787878787878, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.17356982827186584, |
|
"eval_overall_accuracy": 0.9601189001733961, |
|
"eval_overall_f1": 0.819047619047619, |
|
"eval_overall_precision": 0.7737789203084833, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.9929, |
|
"eval_samples_per_second": 188.343, |
|
"eval_steps_per_second": 3.022, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 0.2948610186576843, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0319, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.7919463087248322, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7375, |
|
"eval_LOCATION_recall": 0.855072463768116, |
|
"eval_ORGANIZATION_f1": 0.6865671641791045, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6301369863013698, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.89937106918239, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8666666666666667, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.8059701492537314, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7714285714285715, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.8125, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7878787878787878, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1768426150083542, |
|
"eval_overall_accuracy": 0.9608620262571216, |
|
"eval_overall_f1": 0.8224043715846995, |
|
"eval_overall_precision": 0.7797927461139896, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 1.0129, |
|
"eval_samples_per_second": 184.62, |
|
"eval_steps_per_second": 2.962, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 2.261873483657837, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0322, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.8163265306122449, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7692307692307693, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6814814814814815, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6216216216216216, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.89937106918239, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8666666666666667, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.8059701492537314, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7714285714285715, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.8125, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7878787878787878, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.17177316546440125, |
|
"eval_overall_accuracy": 0.9618528610354223, |
|
"eval_overall_f1": 0.8262653898768809, |
|
"eval_overall_precision": 0.7844155844155845, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 0.9871, |
|
"eval_samples_per_second": 189.451, |
|
"eval_steps_per_second": 3.039, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 0.4583621025085449, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0299, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6715328467153285, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6052631578947368, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8895899053627759, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8597560975609756, |
|
"eval_PERSON_recall": 0.9215686274509803, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1779460459947586, |
|
"eval_overall_accuracy": 0.9601189001733961, |
|
"eval_overall_f1": 0.8152173913043478, |
|
"eval_overall_precision": 0.7692307692307693, |
|
"eval_overall_recall": 0.8670520231213873, |
|
"eval_runtime": 1.0047, |
|
"eval_samples_per_second": 186.125, |
|
"eval_steps_per_second": 2.986, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 0.3838861882686615, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0291, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.7947019867549668, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7317073170731707, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6814814814814815, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6216216216216216, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.9056603773584905, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8727272727272727, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.787878787878788, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7647058823529411, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.18026097118854523, |
|
"eval_overall_accuracy": 0.9606143175625464, |
|
"eval_overall_f1": 0.8217687074829931, |
|
"eval_overall_precision": 0.7763496143958869, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 0.9947, |
|
"eval_samples_per_second": 187.989, |
|
"eval_steps_per_second": 3.016, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 0.7108933329582214, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0295, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.7947019867549668, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7317073170731707, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6865671641791045, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6301369863013698, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.9028213166144202, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8674698795180723, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7428571428571429, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.8125, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7878787878787878, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.18334877490997314, |
|
"eval_overall_accuracy": 0.9606143175625464, |
|
"eval_overall_f1": 0.8217687074829931, |
|
"eval_overall_precision": 0.7763496143958869, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 0.9967, |
|
"eval_samples_per_second": 187.622, |
|
"eval_steps_per_second": 3.01, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 0.06356514245271683, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.0288, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.7894736842105263, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7228915662650602, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.676470588235294, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6133333333333333, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8958990536277602, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8658536585365854, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7428571428571429, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1836617887020111, |
|
"eval_overall_accuracy": 0.9596234827842457, |
|
"eval_overall_f1": 0.814111261872456, |
|
"eval_overall_precision": 0.7672634271099744, |
|
"eval_overall_recall": 0.8670520231213873, |
|
"eval_runtime": 1.0023, |
|
"eval_samples_per_second": 186.57, |
|
"eval_steps_per_second": 2.993, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 1.0761598348617554, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.0286, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.7999999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6969696969696969, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.647887323943662, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8958990536277602, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8658536585365854, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.7536231884057971, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.18496443331241608, |
|
"eval_overall_accuracy": 0.9596234827842457, |
|
"eval_overall_f1": 0.8174386920980926, |
|
"eval_overall_precision": 0.7731958762886598, |
|
"eval_overall_recall": 0.8670520231213873, |
|
"eval_runtime": 0.9924, |
|
"eval_samples_per_second": 188.438, |
|
"eval_steps_per_second": 3.023, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 0.6377687454223633, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0296, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.7947019867549668, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7317073170731707, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.7022900763358779, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6571428571428571, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.89937106918239, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8666666666666667, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7826086956521738, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7297297297297297, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.18578113615512848, |
|
"eval_overall_accuracy": 0.9606143175625464, |
|
"eval_overall_f1": 0.8228882833787465, |
|
"eval_overall_precision": 0.7783505154639175, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 0.9942, |
|
"eval_samples_per_second": 188.095, |
|
"eval_steps_per_second": 3.018, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 0.9133962392807007, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0291, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.7947019867549668, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7317073170731707, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6428571428571429, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.569620253164557, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.9056603773584905, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8727272727272727, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.7536231884057971, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7761194029850746, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7222222222222222, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.19771257042884827, |
|
"eval_overall_accuracy": 0.9573941045330691, |
|
"eval_overall_f1": 0.8080536912751678, |
|
"eval_overall_precision": 0.7543859649122807, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.9881, |
|
"eval_samples_per_second": 189.247, |
|
"eval_steps_per_second": 3.036, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 0.2774830758571625, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0286, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.8053691275167786, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6923076923076924, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6521739130434783, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.8924050632911392, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8650306748466258, |
|
"eval_PERSON_recall": 0.9215686274509803, |
|
"eval_QUANTITY_f1": 0.7536231884057971, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7761194029850746, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7222222222222222, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.18613538146018982, |
|
"eval_overall_accuracy": 0.9591280653950953, |
|
"eval_overall_f1": 0.8153214774281805, |
|
"eval_overall_precision": 0.7740259740259741, |
|
"eval_overall_recall": 0.861271676300578, |
|
"eval_runtime": 0.9926, |
|
"eval_samples_per_second": 188.388, |
|
"eval_steps_per_second": 3.022, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 0.32229432463645935, |
|
"learning_rate": 9e-06, |
|
"loss": 0.028, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.7999999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6962962962962963, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6351351351351351, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.89937106918239, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8666666666666667, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7941176470588235, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.19613806903362274, |
|
"eval_overall_accuracy": 0.9596234827842457, |
|
"eval_overall_f1": 0.8222523744911805, |
|
"eval_overall_precision": 0.7749360613810742, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 0.999, |
|
"eval_samples_per_second": 187.18, |
|
"eval_steps_per_second": 3.003, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 0.18774951994419098, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.0268, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.7999999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6762589928057554, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6025641025641025, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.8895899053627759, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8597560975609756, |
|
"eval_PERSON_recall": 0.9215686274509803, |
|
"eval_QUANTITY_f1": 0.7826086956521738, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7297297297297297, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1944919377565384, |
|
"eval_overall_accuracy": 0.9588803567005202, |
|
"eval_overall_f1": 0.8124156545209177, |
|
"eval_overall_precision": 0.7620253164556962, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.9979, |
|
"eval_samples_per_second": 187.384, |
|
"eval_steps_per_second": 3.006, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 1.8088972568511963, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0274, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.8163265306122449, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7692307692307693, |
|
"eval_LOCATION_recall": 0.8695652173913043, |
|
"eval_ORGANIZATION_f1": 0.6956521739130435, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6233766233766234, |
|
"eval_ORGANIZATION_recall": 0.7868852459016393, |
|
"eval_PERSON_f1": 0.8924050632911392, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8650306748466258, |
|
"eval_PERSON_recall": 0.9215686274509803, |
|
"eval_QUANTITY_f1": 0.7647058823529411, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8125, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1904267519712448, |
|
"eval_overall_accuracy": 0.9596234827842457, |
|
"eval_overall_f1": 0.8201634877384196, |
|
"eval_overall_precision": 0.7757731958762887, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.9962, |
|
"eval_samples_per_second": 187.71, |
|
"eval_steps_per_second": 3.011, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 0.25640690326690674, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0272, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.8187919463087248, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6818181818181818, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6338028169014085, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.8895899053627759, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8597560975609756, |
|
"eval_PERSON_recall": 0.9215686274509803, |
|
"eval_QUANTITY_f1": 0.8181818181818182, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7941176470588235, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.8125, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7878787878787878, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.18857501447200775, |
|
"eval_overall_accuracy": 0.9611097349516968, |
|
"eval_overall_f1": 0.8241758241758242, |
|
"eval_overall_precision": 0.7853403141361257, |
|
"eval_overall_recall": 0.8670520231213873, |
|
"eval_runtime": 1.0634, |
|
"eval_samples_per_second": 175.846, |
|
"eval_steps_per_second": 2.821, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 0.6918984055519104, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0265, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.8187919463087248, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6716417910447762, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6164383561643836, |
|
"eval_ORGANIZATION_recall": 0.7377049180327869, |
|
"eval_PERSON_f1": 0.8930817610062893, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8606060606060606, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.7941176470588235, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.19140414893627167, |
|
"eval_overall_accuracy": 0.9601189001733961, |
|
"eval_overall_f1": 0.8201634877384196, |
|
"eval_overall_precision": 0.7757731958762887, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.9935, |
|
"eval_samples_per_second": 188.225, |
|
"eval_steps_per_second": 3.02, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 0.5062441229820251, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0264, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.8243243243243245, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7721518987341772, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6911764705882353, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6266666666666667, |
|
"eval_ORGANIZATION_recall": 0.7704918032786885, |
|
"eval_PERSON_f1": 0.89937106918239, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8666666666666667, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.8059701492537314, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7714285714285715, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1898663192987442, |
|
"eval_overall_accuracy": 0.9611097349516968, |
|
"eval_overall_f1": 0.8283378746594006, |
|
"eval_overall_precision": 0.7835051546391752, |
|
"eval_overall_recall": 0.8786127167630058, |
|
"eval_runtime": 1.0004, |
|
"eval_samples_per_second": 186.919, |
|
"eval_steps_per_second": 2.999, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 0.9881439805030823, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0265, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6814814814814815, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6216216216216216, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8895899053627759, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8597560975609756, |
|
"eval_PERSON_recall": 0.9215686274509803, |
|
"eval_QUANTITY_f1": 0.8059701492537314, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7714285714285715, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.18475988507270813, |
|
"eval_overall_accuracy": 0.9601189001733961, |
|
"eval_overall_f1": 0.8179347826086956, |
|
"eval_overall_precision": 0.7717948717948718, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.9985, |
|
"eval_samples_per_second": 187.283, |
|
"eval_steps_per_second": 3.005, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 0.8410730957984924, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0272, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6969696969696969, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.647887323943662, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8930817610062893, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8606060606060606, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.8059701492537314, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7714285714285715, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.18852190673351288, |
|
"eval_overall_accuracy": 0.961357443646272, |
|
"eval_overall_f1": 0.8240109140518418, |
|
"eval_overall_precision": 0.7803617571059431, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 0.9938, |
|
"eval_samples_per_second": 188.167, |
|
"eval_steps_per_second": 3.019, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 0.46544983983039856, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0247, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6715328467153285, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6052631578947368, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8930817610062893, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8606060606060606, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.823529411764706, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7777777777777778, |
|
"eval_QUANTITY_recall": 0.875, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.19199509918689728, |
|
"eval_overall_accuracy": 0.9598711914788209, |
|
"eval_overall_f1": 0.8200270635994588, |
|
"eval_overall_precision": 0.7709923664122137, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 1.0076, |
|
"eval_samples_per_second": 185.591, |
|
"eval_steps_per_second": 2.977, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 0.5228121280670166, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0257, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6814814814814815, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6216216216216216, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8895899053627759, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8597560975609756, |
|
"eval_PERSON_recall": 0.9215686274509803, |
|
"eval_QUANTITY_f1": 0.8059701492537314, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7714285714285715, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.18916358053684235, |
|
"eval_overall_accuracy": 0.9608620262571216, |
|
"eval_overall_f1": 0.8201634877384196, |
|
"eval_overall_precision": 0.7757731958762887, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.9851, |
|
"eval_samples_per_second": 189.831, |
|
"eval_steps_per_second": 3.045, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 1.0351158380508423, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.0272, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6715328467153285, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6052631578947368, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8987341772151898, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8711656441717791, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.8181818181818182, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.7941176470588235, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.19310089945793152, |
|
"eval_overall_accuracy": 0.9601189001733961, |
|
"eval_overall_f1": 0.8228882833787465, |
|
"eval_overall_precision": 0.7783505154639175, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 1.0032, |
|
"eval_samples_per_second": 186.402, |
|
"eval_steps_per_second": 2.99, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 1.0168826580047607, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.0264, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6715328467153285, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6052631578947368, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8895899053627759, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8597560975609756, |
|
"eval_PERSON_recall": 0.9215686274509803, |
|
"eval_QUANTITY_f1": 0.7941176470588235, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.19347640872001648, |
|
"eval_overall_accuracy": 0.9588803567005202, |
|
"eval_overall_f1": 0.8157181571815717, |
|
"eval_overall_precision": 0.7678571428571429, |
|
"eval_overall_recall": 0.869942196531792, |
|
"eval_runtime": 0.994, |
|
"eval_samples_per_second": 188.123, |
|
"eval_steps_per_second": 3.018, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 1.8966048955917358, |
|
"learning_rate": 3e-06, |
|
"loss": 0.025, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6865671641791045, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6301369863013698, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.89937106918239, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8666666666666667, |
|
"eval_PERSON_recall": 0.934640522875817, |
|
"eval_QUANTITY_f1": 0.7941176470588235, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.1931447982788086, |
|
"eval_overall_accuracy": 0.9601189001733961, |
|
"eval_overall_f1": 0.8244897959183674, |
|
"eval_overall_precision": 0.7789203084832905, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 0.9943, |
|
"eval_samples_per_second": 188.071, |
|
"eval_steps_per_second": 3.017, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 0.3385007679462433, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0238, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6814814814814815, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6216216216216216, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.9056603773584905, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8727272727272727, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.7941176470588235, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.787878787878788, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.8387096774193549, |
|
"eval_loss": 0.19391222298145294, |
|
"eval_overall_accuracy": 0.9603666088679713, |
|
"eval_overall_f1": 0.8249660786974219, |
|
"eval_overall_precision": 0.7774936061381074, |
|
"eval_overall_recall": 0.8786127167630058, |
|
"eval_runtime": 1.0009, |
|
"eval_samples_per_second": 186.836, |
|
"eval_steps_per_second": 2.997, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 0.21799148619174957, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0253, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.676470588235294, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6133333333333333, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.9056603773584905, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8727272727272727, |
|
"eval_PERSON_recall": 0.9411764705882353, |
|
"eval_QUANTITY_f1": 0.7941176470588235, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.8181818181818182, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7714285714285715, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.19421541690826416, |
|
"eval_overall_accuracy": 0.9606143175625464, |
|
"eval_overall_f1": 0.8265582655826559, |
|
"eval_overall_precision": 0.7780612244897959, |
|
"eval_overall_recall": 0.8815028901734104, |
|
"eval_runtime": 1.1499, |
|
"eval_samples_per_second": 162.627, |
|
"eval_steps_per_second": 2.609, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 0.6869099736213684, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.0258, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6814814814814815, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6216216216216216, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8895899053627759, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8597560975609756, |
|
"eval_PERSON_recall": 0.9215686274509803, |
|
"eval_QUANTITY_f1": 0.7941176470588235, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.8307692307692308, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7941176470588235, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.19163855910301208, |
|
"eval_overall_accuracy": 0.9603666088679713, |
|
"eval_overall_f1": 0.8217687074829931, |
|
"eval_overall_precision": 0.7763496143958869, |
|
"eval_overall_recall": 0.8728323699421965, |
|
"eval_runtime": 0.9961, |
|
"eval_samples_per_second": 187.732, |
|
"eval_steps_per_second": 3.012, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 0.3732462525367737, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0237, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6715328467153285, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6052631578947368, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8930817610062893, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8606060606060606, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.7941176470588235, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.8307692307692308, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7941176470588235, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.19394682347774506, |
|
"eval_overall_accuracy": 0.9601189001733961, |
|
"eval_overall_f1": 0.8211382113821138, |
|
"eval_overall_precision": 0.7729591836734694, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 1.0582, |
|
"eval_samples_per_second": 176.711, |
|
"eval_steps_per_second": 2.835, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 0.2899250090122223, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.0236, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.676470588235294, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6133333333333333, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8930817610062893, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8606060606060606, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.7941176470588235, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.8307692307692308, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7941176470588235, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.1942683607339859, |
|
"eval_overall_accuracy": 0.9603666088679713, |
|
"eval_overall_f1": 0.8222523744911805, |
|
"eval_overall_precision": 0.7749360613810742, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 0.9864, |
|
"eval_samples_per_second": 189.57, |
|
"eval_steps_per_second": 3.041, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 0.24946770071983337, |
|
"learning_rate": 0.0, |
|
"loss": 0.0266, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.8133333333333332, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.676470588235294, |
|
"eval_ORGANIZATION_number": 61, |
|
"eval_ORGANIZATION_precision": 0.6133333333333333, |
|
"eval_ORGANIZATION_recall": 0.7540983606557377, |
|
"eval_PERSON_f1": 0.8930817610062893, |
|
"eval_PERSON_number": 153, |
|
"eval_PERSON_precision": 0.8606060606060606, |
|
"eval_PERSON_recall": 0.9281045751633987, |
|
"eval_QUANTITY_f1": 0.7941176470588235, |
|
"eval_QUANTITY_number": 32, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.84375, |
|
"eval_TIME_f1": 0.8307692307692308, |
|
"eval_TIME_number": 31, |
|
"eval_TIME_precision": 0.7941176470588235, |
|
"eval_TIME_recall": 0.8709677419354839, |
|
"eval_loss": 0.19379286468029022, |
|
"eval_overall_accuracy": 0.9603666088679713, |
|
"eval_overall_f1": 0.8222523744911805, |
|
"eval_overall_precision": 0.7749360613810742, |
|
"eval_overall_recall": 0.8757225433526011, |
|
"eval_runtime": 1.0035, |
|
"eval_samples_per_second": 186.351, |
|
"eval_steps_per_second": 2.99, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 10600, |
|
"total_flos": 5088556202474382.0, |
|
"train_loss": 0.07152380032359429, |
|
"train_runtime": 1385.5436, |
|
"train_samples_per_second": 121.757, |
|
"train_steps_per_second": 7.65 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 10600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 5088556202474382.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|