|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 10600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 0.8392817974090576, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 0.9688, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.0879120879120879, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.26666666666666666, |
|
"eval_PERSON_recall": 0.05263157894736842, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.5576337575912476, |
|
"eval_overall_accuracy": 0.8432778489116517, |
|
"eval_overall_f1": 0.042666666666666665, |
|
"eval_overall_precision": 0.21621621621621623, |
|
"eval_overall_recall": 0.023668639053254437, |
|
"eval_runtime": 0.3335, |
|
"eval_samples_per_second": 560.647, |
|
"eval_steps_per_second": 8.994, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 1.1076773405075073, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.4767, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.288659793814433, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.5, |
|
"eval_LOCATION_recall": 0.2028985507246377, |
|
"eval_ORGANIZATION_f1": 0.07058823529411765, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.1111111111111111, |
|
"eval_ORGANIZATION_recall": 0.05172413793103448, |
|
"eval_PERSON_f1": 0.5936739659367396, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.47104247104247104, |
|
"eval_PERSON_recall": 0.8026315789473685, |
|
"eval_QUANTITY_f1": 0.11111111111111112, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.125, |
|
"eval_QUANTITY_recall": 0.1, |
|
"eval_TIME_f1": 0.523076923076923, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.4722222222222222, |
|
"eval_TIME_recall": 0.5862068965517241, |
|
"eval_loss": 0.31268012523651123, |
|
"eval_overall_accuracy": 0.8991037131882202, |
|
"eval_overall_f1": 0.44662921348314605, |
|
"eval_overall_precision": 0.42513368983957217, |
|
"eval_overall_recall": 0.47041420118343197, |
|
"eval_runtime": 0.3348, |
|
"eval_samples_per_second": 558.483, |
|
"eval_steps_per_second": 8.96, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 1.2600445747375488, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.2969, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.6303030303030303, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.5416666666666666, |
|
"eval_LOCATION_recall": 0.7536231884057971, |
|
"eval_ORGANIZATION_f1": 0.4605263157894736, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.3723404255319149, |
|
"eval_ORGANIZATION_recall": 0.603448275862069, |
|
"eval_PERSON_f1": 0.8085106382978723, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.751412429378531, |
|
"eval_PERSON_recall": 0.875, |
|
"eval_QUANTITY_f1": 0.7027027027027029, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5909090909090909, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.7301587301587301, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6764705882352942, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.22261539101600647, |
|
"eval_overall_accuracy": 0.9275288092189501, |
|
"eval_overall_f1": 0.6871008939974458, |
|
"eval_overall_precision": 0.604494382022472, |
|
"eval_overall_recall": 0.7958579881656804, |
|
"eval_runtime": 0.333, |
|
"eval_samples_per_second": 561.501, |
|
"eval_steps_per_second": 9.008, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 1.1735649108886719, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.2125, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.7346938775510203, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6923076923076923, |
|
"eval_LOCATION_recall": 0.782608695652174, |
|
"eval_ORGANIZATION_f1": 0.5354330708661417, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.4927536231884058, |
|
"eval_ORGANIZATION_recall": 0.5862068965517241, |
|
"eval_PERSON_f1": 0.8288288288288289, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7624309392265194, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.6944444444444444, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5952380952380952, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7076923076923076, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6388888888888888, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.17351830005645752, |
|
"eval_overall_accuracy": 0.9400768245838669, |
|
"eval_overall_f1": 0.7365591397849461, |
|
"eval_overall_precision": 0.6748768472906403, |
|
"eval_overall_recall": 0.8106508875739645, |
|
"eval_runtime": 0.3365, |
|
"eval_samples_per_second": 555.787, |
|
"eval_steps_per_second": 8.916, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 1.4631017446517944, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.1759, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.6762589928057554, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.6714285714285714, |
|
"eval_LOCATION_recall": 0.6811594202898551, |
|
"eval_ORGANIZATION_f1": 0.6056338028169014, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5119047619047619, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8466257668711656, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.7931034482758621, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7164179104477612, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8275862068965517, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8275862068965517, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.14357861876487732, |
|
"eval_overall_accuracy": 0.9475032010243278, |
|
"eval_overall_f1": 0.7540983606557377, |
|
"eval_overall_precision": 0.700507614213198, |
|
"eval_overall_recall": 0.8165680473372781, |
|
"eval_runtime": 0.3351, |
|
"eval_samples_per_second": 558.08, |
|
"eval_steps_per_second": 8.953, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 0.8950690627098083, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.1548, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8840579710144928, |
|
"eval_ORGANIZATION_f1": 0.6811594202898551, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5875, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8518518518518517, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8023255813953488, |
|
"eval_PERSON_recall": 0.9078947368421053, |
|
"eval_QUANTITY_f1": 0.7142857142857143, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.625, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.14464175701141357, |
|
"eval_overall_accuracy": 0.952112676056338, |
|
"eval_overall_f1": 0.7866666666666666, |
|
"eval_overall_precision": 0.7160194174757282, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.3323, |
|
"eval_samples_per_second": 562.696, |
|
"eval_steps_per_second": 9.027, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 0.48694196343421936, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.1452, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.8289473684210527, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6870229007633589, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6164383561643836, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.875, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8333333333333334, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.6153846153846154, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.14724624156951904, |
|
"eval_overall_accuracy": 0.9510883482714468, |
|
"eval_overall_f1": 0.7967698519515478, |
|
"eval_overall_precision": 0.7308641975308642, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.3323, |
|
"eval_samples_per_second": 562.777, |
|
"eval_steps_per_second": 9.029, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 0.39879658818244934, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.1368, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.8378378378378378, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7848101265822784, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7142857142857144, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6097560975609756, |
|
"eval_ORGANIZATION_recall": 0.8620689655172413, |
|
"eval_PERSON_f1": 0.8722741433021807, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8284023668639053, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.6376811594202898, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.55, |
|
"eval_TIME_recall": 0.7586206896551724, |
|
"eval_loss": 0.1397438496351242, |
|
"eval_overall_accuracy": 0.9539052496798975, |
|
"eval_overall_f1": 0.8026845637583893, |
|
"eval_overall_precision": 0.7346437346437347, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.3334, |
|
"eval_samples_per_second": 560.876, |
|
"eval_steps_per_second": 8.998, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 1.2802802324295044, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.1278, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.8258064516129032, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7441860465116279, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.5950413223140496, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5714285714285714, |
|
"eval_ORGANIZATION_recall": 0.6206896551724138, |
|
"eval_PERSON_f1": 0.8623853211009175, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8057142857142857, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.6571428571428573, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.5609756097560976, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.14592860639095306, |
|
"eval_overall_accuracy": 0.9528809218950064, |
|
"eval_overall_f1": 0.7800269905533064, |
|
"eval_overall_precision": 0.71712158808933, |
|
"eval_overall_recall": 0.8550295857988166, |
|
"eval_runtime": 0.3343, |
|
"eval_samples_per_second": 559.31, |
|
"eval_steps_per_second": 8.973, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 1.4159973859786987, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.1202, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.7999999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7209302325581395, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6614173228346457, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6086956521739131, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.877742946708464, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8383233532934131, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.6944444444444444, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5952380952380952, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8064516129032258, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.13962122797966003, |
|
"eval_overall_accuracy": 0.9559539052496799, |
|
"eval_overall_f1": 0.8, |
|
"eval_overall_precision": 0.7405541561712846, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.3332, |
|
"eval_samples_per_second": 561.16, |
|
"eval_steps_per_second": 9.003, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 1.0556025505065918, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.1166, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.8552631578947367, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7831325301204819, |
|
"eval_LOCATION_recall": 0.9420289855072463, |
|
"eval_ORGANIZATION_f1": 0.6515151515151516, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.581081081081081, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.88125, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8392857142857143, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.6944444444444444, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5952380952380952, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13871203362941742, |
|
"eval_overall_accuracy": 0.9556978233034571, |
|
"eval_overall_f1": 0.8054054054054053, |
|
"eval_overall_precision": 0.7412935323383084, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.3363, |
|
"eval_samples_per_second": 556.023, |
|
"eval_steps_per_second": 8.92, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 1.1935970783233643, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.1108, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.5641025641025641, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.559322033898305, |
|
"eval_ORGANIZATION_recall": 0.5689655172413793, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13067495822906494, |
|
"eval_overall_accuracy": 0.9580025608194622, |
|
"eval_overall_f1": 0.8062234794908061, |
|
"eval_overall_precision": 0.7723577235772358, |
|
"eval_overall_recall": 0.8431952662721893, |
|
"eval_runtime": 0.3341, |
|
"eval_samples_per_second": 559.688, |
|
"eval_steps_per_second": 8.979, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 0.38182273507118225, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.1052, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.8476821192052981, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.71875, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6571428571428571, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8952380952380953, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8650306748466258, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13124220073223114, |
|
"eval_overall_accuracy": 0.9613316261203585, |
|
"eval_overall_f1": 0.8282548476454293, |
|
"eval_overall_precision": 0.7786458333333334, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.3361, |
|
"eval_samples_per_second": 556.458, |
|
"eval_steps_per_second": 8.927, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 1.8100732564926147, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.104, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6991869918699186, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6615384615384615, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.9085173501577286, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8727272727272727, |
|
"eval_PERSON_recall": 0.9473684210526315, |
|
"eval_QUANTITY_f1": 0.6956521739130435, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6153846153846154, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7419354838709677, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.696969696969697, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.13739244639873505, |
|
"eval_overall_accuracy": 0.9608194622279129, |
|
"eval_overall_f1": 0.8284518828451882, |
|
"eval_overall_precision": 0.783641160949868, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.3335, |
|
"eval_samples_per_second": 560.761, |
|
"eval_steps_per_second": 8.996, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 1.0627801418304443, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.0963, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.8366013071895425, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7619047619047619, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6610169491525424, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.65, |
|
"eval_ORGANIZATION_recall": 0.6724137931034483, |
|
"eval_PERSON_f1": 0.9102564102564101, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8875, |
|
"eval_PERSON_recall": 0.9342105263157895, |
|
"eval_QUANTITY_f1": 0.6233766233766233, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5106382978723404, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.13979628682136536, |
|
"eval_overall_accuracy": 0.9572343149807938, |
|
"eval_overall_f1": 0.8116343490304708, |
|
"eval_overall_precision": 0.7630208333333334, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.3344, |
|
"eval_samples_per_second": 559.247, |
|
"eval_steps_per_second": 8.972, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 0.8222811222076416, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.0952, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.8311688311688311, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7529411764705882, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7343749999999999, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6714285714285714, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.9067524115755626, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8867924528301887, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.676056338028169, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5853658536585366, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.14147908985614777, |
|
"eval_overall_accuracy": 0.9580025608194622, |
|
"eval_overall_f1": 0.8287292817679558, |
|
"eval_overall_precision": 0.7772020725388601, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.3348, |
|
"eval_samples_per_second": 558.612, |
|
"eval_steps_per_second": 8.962, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 0.7422318458557129, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.0902, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.8533333333333333, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7901234567901234, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7000000000000001, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5975609756097561, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.89171974522293, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.6315789473684211, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5217391304347826, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7540983606557378, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.71875, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.14226044714450836, |
|
"eval_overall_accuracy": 0.9580025608194622, |
|
"eval_overall_f1": 0.8097165991902834, |
|
"eval_overall_precision": 0.7444168734491315, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.3343, |
|
"eval_samples_per_second": 559.424, |
|
"eval_steps_per_second": 8.975, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 0.5720771551132202, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.0919, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6976744186046512, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6338028169014085, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.9113924050632912, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8780487804878049, |
|
"eval_PERSON_recall": 0.9473684210526315, |
|
"eval_QUANTITY_f1": 0.676056338028169, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5853658536585366, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7301587301587301, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6764705882352942, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.14349369704723358, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8275862068965517, |
|
"eval_overall_precision": 0.7751937984496124, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.3339, |
|
"eval_samples_per_second": 560.088, |
|
"eval_steps_per_second": 8.985, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 1.00640070438385, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.0864, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6885245901639345, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.65625, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.9050632911392406, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8719512195121951, |
|
"eval_PERSON_recall": 0.9407894736842105, |
|
"eval_QUANTITY_f1": 0.64, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5333333333333333, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7796610169491527, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7666666666666667, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.14329810440540314, |
|
"eval_overall_accuracy": 0.9582586427656851, |
|
"eval_overall_f1": 0.8205841446453407, |
|
"eval_overall_precision": 0.7742782152230971, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.338, |
|
"eval_samples_per_second": 553.255, |
|
"eval_steps_per_second": 8.876, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 0.7463036179542542, |
|
"learning_rate": 4e-05, |
|
"loss": 0.0853, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.8749999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.84, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7230769230769231, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6527777777777778, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.9137380191693291, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8881987577639752, |
|
"eval_PERSON_recall": 0.9407894736842105, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7540983606557378, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.71875, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.13515153527259827, |
|
"eval_overall_accuracy": 0.963124199743918, |
|
"eval_overall_f1": 0.8431372549019608, |
|
"eval_overall_precision": 0.800531914893617, |
|
"eval_overall_recall": 0.8905325443786982, |
|
"eval_runtime": 0.3312, |
|
"eval_samples_per_second": 564.613, |
|
"eval_steps_per_second": 9.058, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 0.4474703073501587, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.0782, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.8322147651006713, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.696969696969697, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6216216216216216, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.9050632911392406, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8719512195121951, |
|
"eval_PERSON_recall": 0.9407894736842105, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1520513892173767, |
|
"eval_overall_accuracy": 0.9574903969270167, |
|
"eval_overall_f1": 0.8241758241758241, |
|
"eval_overall_precision": 0.7692307692307693, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.3358, |
|
"eval_samples_per_second": 556.946, |
|
"eval_steps_per_second": 8.935, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 0.46933385729789734, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.0778, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.8533333333333333, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7901234567901234, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7259259259259259, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6363636363636364, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.8952380952380953, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8650306748466258, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7272727272727272, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.14189890027046204, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8308115543328748, |
|
"eval_overall_precision": 0.7763496143958869, |
|
"eval_overall_recall": 0.893491124260355, |
|
"eval_runtime": 0.3349, |
|
"eval_samples_per_second": 558.354, |
|
"eval_steps_per_second": 8.958, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 0.5191448330879211, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.0751, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6976744186046512, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6338028169014085, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.9015873015873016, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8711656441717791, |
|
"eval_PERSON_recall": 0.9342105263157895, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1431107521057129, |
|
"eval_overall_accuracy": 0.9600512163892445, |
|
"eval_overall_f1": 0.8243430152143846, |
|
"eval_overall_precision": 0.7740259740259741, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.3347, |
|
"eval_samples_per_second": 558.691, |
|
"eval_steps_per_second": 8.963, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 1.5136590003967285, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.0761, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6935483870967741, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6515151515151515, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.9079365079365079, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8773006134969326, |
|
"eval_PERSON_recall": 0.9407894736842105, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7058823529411765, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1410786360502243, |
|
"eval_overall_accuracy": 0.9633802816901409, |
|
"eval_overall_f1": 0.8394366197183097, |
|
"eval_overall_precision": 0.8010752688172043, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.3473, |
|
"eval_samples_per_second": 538.469, |
|
"eval_steps_per_second": 8.639, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 0.8224151134490967, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.0718, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6923076923076923, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.625, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.9079365079365079, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8773006134969326, |
|
"eval_PERSON_recall": 0.9407894736842105, |
|
"eval_QUANTITY_f1": 0.64, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5333333333333333, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7301587301587301, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6764705882352942, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.15752357244491577, |
|
"eval_overall_accuracy": 0.9577464788732394, |
|
"eval_overall_f1": 0.8164383561643835, |
|
"eval_overall_precision": 0.7602040816326531, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.3326, |
|
"eval_samples_per_second": 562.261, |
|
"eval_steps_per_second": 9.02, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 1.1950877904891968, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.0706, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.8551724137931034, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8157894736842105, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7213114754098361, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6875, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.9166666666666667, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.89375, |
|
"eval_PERSON_recall": 0.9407894736842105, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.14247971773147583, |
|
"eval_overall_accuracy": 0.9623559539052496, |
|
"eval_overall_f1": 0.8389830508474576, |
|
"eval_overall_precision": 0.8027027027027027, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.3335, |
|
"eval_samples_per_second": 560.748, |
|
"eval_steps_per_second": 8.996, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 0.48883256316185, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.0675, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7101449275362319, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6125, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.890282131661442, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8502994011976048, |
|
"eval_PERSON_recall": 0.9342105263157895, |
|
"eval_QUANTITY_f1": 0.6857142857142857, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.16071684658527374, |
|
"eval_overall_accuracy": 0.9559539052496799, |
|
"eval_overall_f1": 0.819538670284939, |
|
"eval_overall_precision": 0.7568922305764411, |
|
"eval_overall_recall": 0.893491124260355, |
|
"eval_runtime": 0.3357, |
|
"eval_samples_per_second": 557.057, |
|
"eval_steps_per_second": 8.937, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 5.45798397064209, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.0692, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.688, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6417910447761194, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8832807570977917, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8484848484848485, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.7301587301587301, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6764705882352942, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.14975115656852722, |
|
"eval_overall_accuracy": 0.9592829705505762, |
|
"eval_overall_f1": 0.8205841446453407, |
|
"eval_overall_precision": 0.7742782152230971, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.3351, |
|
"eval_samples_per_second": 558.088, |
|
"eval_steps_per_second": 8.953, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 0.3084903359413147, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.0663, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.84, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7777777777777778, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7000000000000001, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5975609756097561, |
|
"eval_ORGANIZATION_recall": 0.8448275862068966, |
|
"eval_PERSON_f1": 0.8924050632911392, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8597560975609756, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7272727272727272, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.148148775100708, |
|
"eval_overall_accuracy": 0.9592829705505762, |
|
"eval_overall_f1": 0.8201634877384196, |
|
"eval_overall_precision": 0.76010101010101, |
|
"eval_overall_recall": 0.8905325443786982, |
|
"eval_runtime": 0.3329, |
|
"eval_samples_per_second": 561.66, |
|
"eval_steps_per_second": 9.011, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 1.554962396621704, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.0642, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6612903225806452, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6212121212121212, |
|
"eval_ORGANIZATION_recall": 0.7068965517241379, |
|
"eval_PERSON_f1": 0.889589905362776, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8545454545454545, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.8253968253968254, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7878787878787878, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.14457598328590393, |
|
"eval_overall_accuracy": 0.963124199743918, |
|
"eval_overall_f1": 0.8338028169014083, |
|
"eval_overall_precision": 0.7956989247311828, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.3355, |
|
"eval_samples_per_second": 557.403, |
|
"eval_steps_per_second": 8.942, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.40657302737236023, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.0602, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.65625, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8924050632911392, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8597560975609756, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7272727272727272, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1596260815858841, |
|
"eval_overall_accuracy": 0.9590268886043534, |
|
"eval_overall_f1": 0.8189415041782729, |
|
"eval_overall_precision": 0.7736842105263158, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.3328, |
|
"eval_samples_per_second": 561.9, |
|
"eval_steps_per_second": 9.014, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 0.3220694363117218, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.0618, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.8456375838926175, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7258064516129032, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6818181818181818, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8980891719745223, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8703703703703703, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.676056338028169, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5853658536585366, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7540983606557378, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.71875, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.15103064477443695, |
|
"eval_overall_accuracy": 0.9605633802816902, |
|
"eval_overall_f1": 0.82336578581363, |
|
"eval_overall_precision": 0.7769028871391076, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.336, |
|
"eval_samples_per_second": 556.607, |
|
"eval_steps_per_second": 8.93, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 1.0746521949768066, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.0587, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6976744186046512, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6338028169014085, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.9050632911392406, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8719512195121951, |
|
"eval_PERSON_recall": 0.9407894736842105, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.15125295519828796, |
|
"eval_overall_accuracy": 0.9636363636363636, |
|
"eval_overall_f1": 0.840782122905028, |
|
"eval_overall_precision": 0.7962962962962963, |
|
"eval_overall_recall": 0.8905325443786982, |
|
"eval_runtime": 0.3377, |
|
"eval_samples_per_second": 553.74, |
|
"eval_steps_per_second": 8.884, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 1.5852210521697998, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.0575, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.8435374149659864, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7948717948717948, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.7175572519083969, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6438356164383562, |
|
"eval_ORGANIZATION_recall": 0.8103448275862069, |
|
"eval_PERSON_f1": 0.8924050632911392, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8597560975609756, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.6857142857142857, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.696969696969697, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6216216216216216, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.17214131355285645, |
|
"eval_overall_accuracy": 0.9574903969270167, |
|
"eval_overall_f1": 0.8136986301369863, |
|
"eval_overall_precision": 0.7576530612244898, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.332, |
|
"eval_samples_per_second": 563.205, |
|
"eval_steps_per_second": 9.035, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 0.709221601486206, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.0568, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.736, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6865671641791045, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.889589905362776, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8545454545454545, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.6956521739130435, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6153846153846154, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7666666666666667, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7419354838709677, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.16309089958667755, |
|
"eval_overall_accuracy": 0.9605633802816902, |
|
"eval_overall_f1": 0.8312412831241283, |
|
"eval_overall_precision": 0.7862796833773087, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.3342, |
|
"eval_samples_per_second": 559.545, |
|
"eval_steps_per_second": 8.977, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 0.5662766098976135, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.058, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.8671328671328672, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8378378378378378, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.711111111111111, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6233766233766234, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.9079365079365079, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8773006134969326, |
|
"eval_PERSON_recall": 0.9407894736842105, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.15275219082832336, |
|
"eval_overall_accuracy": 0.9618437900128041, |
|
"eval_overall_f1": 0.8412256267409471, |
|
"eval_overall_precision": 0.7947368421052632, |
|
"eval_overall_recall": 0.893491124260355, |
|
"eval_runtime": 0.3343, |
|
"eval_samples_per_second": 559.388, |
|
"eval_steps_per_second": 8.974, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 0.11498302221298218, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.0542, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6875, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6285714285714286, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.9015873015873016, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8711656441717791, |
|
"eval_PERSON_recall": 0.9342105263157895, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1606374979019165, |
|
"eval_overall_accuracy": 0.9597951344430218, |
|
"eval_overall_f1": 0.8272980501392758, |
|
"eval_overall_precision": 0.781578947368421, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.334, |
|
"eval_samples_per_second": 559.858, |
|
"eval_steps_per_second": 8.982, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 0.5296043157577515, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.0543, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.8456375838926175, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7058823529411765, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6153846153846154, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.9038461538461539, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.88125, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.6666666666666666, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5714285714285714, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.16339102387428284, |
|
"eval_overall_accuracy": 0.9582586427656851, |
|
"eval_overall_f1": 0.8207934336525308, |
|
"eval_overall_precision": 0.7633587786259542, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.3345, |
|
"eval_samples_per_second": 559.005, |
|
"eval_steps_per_second": 8.968, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 0.7791297435760498, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.0545, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6929133858267716, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6376811594202898, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.78125, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7352941176470589, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.15971286594867706, |
|
"eval_overall_accuracy": 0.9590268886043534, |
|
"eval_overall_f1": 0.8302945301542777, |
|
"eval_overall_precision": 0.7893333333333333, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.3358, |
|
"eval_samples_per_second": 556.857, |
|
"eval_steps_per_second": 8.934, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 1.3748724460601807, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0522, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.8571428571428572, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8076923076923077, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7166666666666668, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6935483870967742, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.8059701492537312, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7297297297297297, |
|
"eval_QUANTITY_recall": 0.9, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.15032222867012024, |
|
"eval_overall_accuracy": 0.9626120358514725, |
|
"eval_overall_f1": 0.8366197183098592, |
|
"eval_overall_precision": 0.7983870967741935, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.3322, |
|
"eval_samples_per_second": 562.995, |
|
"eval_steps_per_second": 9.032, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 0.5511608719825745, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.0484, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6984126984126984, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6470588235294118, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7540983606557378, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.71875, |
|
"eval_TIME_recall": 0.7931034482758621, |
|
"eval_loss": 0.16514161229133606, |
|
"eval_overall_accuracy": 0.9592829705505762, |
|
"eval_overall_f1": 0.8263305322128851, |
|
"eval_overall_precision": 0.7845744680851063, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.3352, |
|
"eval_samples_per_second": 557.858, |
|
"eval_steps_per_second": 8.95, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 0.6805091500282288, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.0472, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.8671328671328672, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8378378378378378, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6984126984126984, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6470588235294118, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.9096774193548387, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7272727272727272, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.16605274379253387, |
|
"eval_overall_accuracy": 0.9600512163892445, |
|
"eval_overall_f1": 0.8321579689703809, |
|
"eval_overall_precision": 0.7951482479784366, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.3329, |
|
"eval_samples_per_second": 561.686, |
|
"eval_steps_per_second": 9.011, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 3.199406147003174, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.0498, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.8749999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.84, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7040000000000001, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6567164179104478, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.9067524115755626, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8867924528301887, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.8059701492537312, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7297297297297297, |
|
"eval_QUANTITY_recall": 0.9, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.155135378241539, |
|
"eval_overall_accuracy": 0.9628681177976952, |
|
"eval_overall_f1": 0.8422535211267606, |
|
"eval_overall_precision": 0.803763440860215, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.3322, |
|
"eval_samples_per_second": 562.861, |
|
"eval_steps_per_second": 9.03, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 1.2136147022247314, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.0474, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.8749999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.84, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7154471544715447, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.676923076923077, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8867924528301887, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8493975903614458, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1694120317697525, |
|
"eval_overall_accuracy": 0.9600512163892445, |
|
"eval_overall_f1": 0.8314606741573034, |
|
"eval_overall_precision": 0.7914438502673797, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.3337, |
|
"eval_samples_per_second": 560.411, |
|
"eval_steps_per_second": 8.991, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 1.1127651929855347, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.0483, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.8551724137931034, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8157894736842105, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.6929133858267716, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6376811594202898, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.6388888888888888, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.5476190476190477, |
|
"eval_QUANTITY_recall": 0.7666666666666667, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.17468813061714172, |
|
"eval_overall_accuracy": 0.954673495518566, |
|
"eval_overall_f1": 0.8138888888888889, |
|
"eval_overall_precision": 0.7670157068062827, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.3348, |
|
"eval_samples_per_second": 558.469, |
|
"eval_steps_per_second": 8.959, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 0.21913494169712067, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.045, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.8513513513513514, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.7974683544303798, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6942148760330579, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.89171974522293, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7272727272727273, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6486486486486487, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1735159456729889, |
|
"eval_overall_accuracy": 0.9577464788732394, |
|
"eval_overall_f1": 0.8200836820083682, |
|
"eval_overall_precision": 0.7757255936675461, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.3358, |
|
"eval_samples_per_second": 556.961, |
|
"eval_steps_per_second": 8.935, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 0.8087287545204163, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.0431, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6829268292682927, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6461538461538462, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8860759493670887, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8536585365853658, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7164179104477612, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.17915095388889313, |
|
"eval_overall_accuracy": 0.9585147247119078, |
|
"eval_overall_f1": 0.8207282913165266, |
|
"eval_overall_precision": 0.7792553191489362, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.3356, |
|
"eval_samples_per_second": 557.259, |
|
"eval_steps_per_second": 8.94, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 1.3942605257034302, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.0424, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.8648648648648648, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7419354838709677, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.696969696969697, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8924050632911392, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8597560975609756, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1734819859266281, |
|
"eval_overall_accuracy": 0.9605633802816902, |
|
"eval_overall_f1": 0.8340306834030683, |
|
"eval_overall_precision": 0.7889182058047494, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.335, |
|
"eval_samples_per_second": 558.27, |
|
"eval_steps_per_second": 8.956, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 0.8996381759643555, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.0426, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7441860465116279, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.676056338028169, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.8867924528301887, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8493975903614458, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.8181818181818182, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.75, |
|
"eval_QUANTITY_recall": 0.9, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.17559018731117249, |
|
"eval_overall_accuracy": 0.9597951344430218, |
|
"eval_overall_f1": 0.8381742738589212, |
|
"eval_overall_precision": 0.787012987012987, |
|
"eval_overall_recall": 0.8964497041420119, |
|
"eval_runtime": 0.3329, |
|
"eval_samples_per_second": 561.775, |
|
"eval_steps_per_second": 9.012, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 0.22222945094108582, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0412, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6548672566371682, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6727272727272727, |
|
"eval_ORGANIZATION_recall": 0.6379310344827587, |
|
"eval_PERSON_f1": 0.8832807570977917, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8484848484848485, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.16795222461223602, |
|
"eval_overall_accuracy": 0.9597951344430218, |
|
"eval_overall_f1": 0.8295454545454545, |
|
"eval_overall_precision": 0.7978142076502732, |
|
"eval_overall_recall": 0.863905325443787, |
|
"eval_runtime": 0.3341, |
|
"eval_samples_per_second": 559.727, |
|
"eval_steps_per_second": 8.98, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 0.7834493517875671, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.0407, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.870748299319728, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8205128205128205, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6557377049180328, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.625, |
|
"eval_ORGANIZATION_recall": 0.6896551724137931, |
|
"eval_PERSON_f1": 0.9015873015873016, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8711656441717791, |
|
"eval_PERSON_recall": 0.9342105263157895, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.17565281689167023, |
|
"eval_overall_accuracy": 0.9595390524967989, |
|
"eval_overall_f1": 0.8286516853932584, |
|
"eval_overall_precision": 0.7887700534759359, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.3349, |
|
"eval_samples_per_second": 558.379, |
|
"eval_steps_per_second": 8.958, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 0.5259361863136292, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0421, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7142857142857142, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6617647058823529, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.18448342382907867, |
|
"eval_overall_accuracy": 0.9587708066581306, |
|
"eval_overall_f1": 0.83008356545961, |
|
"eval_overall_precision": 0.7842105263157895, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.3359, |
|
"eval_samples_per_second": 556.686, |
|
"eval_steps_per_second": 8.931, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 1.3698176145553589, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.0415, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7142857142857142, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6617647058823529, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7941176470588235, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7105263157894737, |
|
"eval_QUANTITY_recall": 0.9, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.180740624666214, |
|
"eval_overall_accuracy": 0.9603072983354674, |
|
"eval_overall_f1": 0.8379888268156425, |
|
"eval_overall_precision": 0.7936507936507936, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.3346, |
|
"eval_samples_per_second": 558.915, |
|
"eval_steps_per_second": 8.967, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 0.6899826526641846, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.0378, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6615384615384615, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5972222222222222, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.8059701492537312, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7297297297297297, |
|
"eval_QUANTITY_recall": 0.9, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1903461366891861, |
|
"eval_overall_accuracy": 0.9587708066581306, |
|
"eval_overall_f1": 0.8250000000000001, |
|
"eval_overall_precision": 0.7774869109947644, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.3444, |
|
"eval_samples_per_second": 542.946, |
|
"eval_steps_per_second": 8.71, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 1.0006171464920044, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0388, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7166666666666668, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6935483870967742, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8980891719745223, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8703703703703703, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7164179104477612, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.18361018598079681, |
|
"eval_overall_accuracy": 0.9592829705505762, |
|
"eval_overall_f1": 0.8326300984528833, |
|
"eval_overall_precision": 0.7935656836461126, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.3373, |
|
"eval_samples_per_second": 554.414, |
|
"eval_steps_per_second": 8.894, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 0.8649386167526245, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.0381, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.688, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6417910447761194, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.89171974522293, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7647058823529413, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6842105263157895, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.17993959784507751, |
|
"eval_overall_accuracy": 0.9595390524967989, |
|
"eval_overall_f1": 0.8382559774964837, |
|
"eval_overall_precision": 0.7989276139410187, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.3352, |
|
"eval_samples_per_second": 557.898, |
|
"eval_steps_per_second": 8.95, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 0.5134249925613403, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.0377, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6451612903225807, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6060606060606061, |
|
"eval_ORGANIZATION_recall": 0.6896551724137931, |
|
"eval_PERSON_f1": 0.8797468354430381, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7941176470588235, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7105263157894737, |
|
"eval_QUANTITY_recall": 0.9, |
|
"eval_TIME_f1": 0.7692307692307692, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6944444444444444, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1980062872171402, |
|
"eval_overall_accuracy": 0.9554417413572344, |
|
"eval_overall_f1": 0.8189415041782729, |
|
"eval_overall_precision": 0.7736842105263158, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.3364, |
|
"eval_samples_per_second": 555.829, |
|
"eval_steps_per_second": 8.917, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 1.7326457500457764, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.0382, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.8671328671328672, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8378378378378378, |
|
"eval_LOCATION_recall": 0.8985507246376812, |
|
"eval_ORGANIZATION_f1": 0.688, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6417910447761194, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8980891719745223, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8703703703703703, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7352941176470588, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1960817277431488, |
|
"eval_overall_accuracy": 0.9562099871959027, |
|
"eval_overall_f1": 0.8274894810659188, |
|
"eval_overall_precision": 0.7866666666666666, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.3347, |
|
"eval_samples_per_second": 558.716, |
|
"eval_steps_per_second": 8.963, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 0.785622239112854, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.0358, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6984126984126984, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6470588235294118, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8952380952380953, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8650306748466258, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7536231884057971, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.1875164657831192, |
|
"eval_overall_accuracy": 0.9600512163892445, |
|
"eval_overall_f1": 0.835195530726257, |
|
"eval_overall_precision": 0.791005291005291, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.3334, |
|
"eval_samples_per_second": 560.851, |
|
"eval_steps_per_second": 8.998, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 0.8723583221435547, |
|
"learning_rate": 2e-05, |
|
"loss": 0.0355, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.703125, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6428571428571429, |
|
"eval_ORGANIZATION_recall": 0.7758620689655172, |
|
"eval_PERSON_f1": 0.8938906752411576, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8742138364779874, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7164179104477612, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6486486486486487, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8196721311475409, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.19338777661323547, |
|
"eval_overall_accuracy": 0.9577464788732394, |
|
"eval_overall_f1": 0.8314606741573034, |
|
"eval_overall_precision": 0.7914438502673797, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.3431, |
|
"eval_samples_per_second": 544.973, |
|
"eval_steps_per_second": 8.743, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 1.1464908123016357, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.037, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.8749999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.84, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6929133858267716, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6376811594202898, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7647058823529413, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6842105263157895, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.18568746745586395, |
|
"eval_overall_accuracy": 0.9592829705505762, |
|
"eval_overall_f1": 0.829608938547486, |
|
"eval_overall_precision": 0.7857142857142857, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.3342, |
|
"eval_samples_per_second": 559.582, |
|
"eval_steps_per_second": 8.977, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 0.577111542224884, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.0342, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.671875, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6142857142857143, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7272727272727272, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.19420312345027924, |
|
"eval_overall_accuracy": 0.9564660691421255, |
|
"eval_overall_f1": 0.8184357541899442, |
|
"eval_overall_precision": 0.7751322751322751, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.3361, |
|
"eval_samples_per_second": 556.377, |
|
"eval_steps_per_second": 8.926, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 0.4379956126213074, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0349, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.888888888888889, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8533333333333334, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6942148760330579, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8924050632911392, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8597560975609756, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.8059701492537312, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7297297297297297, |
|
"eval_QUANTITY_recall": 0.9, |
|
"eval_TIME_f1": 0.8387096774193549, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7878787878787878, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.18639543652534485, |
|
"eval_overall_accuracy": 0.9603072983354674, |
|
"eval_overall_f1": 0.8450704225352114, |
|
"eval_overall_precision": 0.8064516129032258, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.339, |
|
"eval_samples_per_second": 551.625, |
|
"eval_steps_per_second": 8.85, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 1.331531286239624, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0316, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6814814814814815, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5974025974025974, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.8825396825396825, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.852760736196319, |
|
"eval_PERSON_recall": 0.9144736842105263, |
|
"eval_QUANTITY_f1": 0.7647058823529413, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6842105263157895, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.19557389616966248, |
|
"eval_overall_accuracy": 0.9554417413572344, |
|
"eval_overall_f1": 0.8209366391184573, |
|
"eval_overall_precision": 0.7680412371134021, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.3402, |
|
"eval_samples_per_second": 549.599, |
|
"eval_steps_per_second": 8.817, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 0.3099250793457031, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0358, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6808510638297872, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.5783132530120482, |
|
"eval_ORGANIZATION_recall": 0.8275862068965517, |
|
"eval_PERSON_f1": 0.9015873015873016, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8711656441717791, |
|
"eval_PERSON_recall": 0.9342105263157895, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.19938279688358307, |
|
"eval_overall_accuracy": 0.9567221510883482, |
|
"eval_overall_f1": 0.8290013679890562, |
|
"eval_overall_precision": 0.7709923664122137, |
|
"eval_overall_recall": 0.8964497041420119, |
|
"eval_runtime": 0.3388, |
|
"eval_samples_per_second": 551.909, |
|
"eval_steps_per_second": 8.854, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 0.5862748026847839, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.0317, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6559999999999999, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6119402985074627, |
|
"eval_ORGANIZATION_recall": 0.7068965517241379, |
|
"eval_PERSON_f1": 0.8952380952380953, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8650306748466258, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7058823529411765, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.631578947368421, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.21487130224704742, |
|
"eval_overall_accuracy": 0.9556978233034571, |
|
"eval_overall_f1": 0.8200836820083682, |
|
"eval_overall_precision": 0.7757255936675461, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.3359, |
|
"eval_samples_per_second": 556.74, |
|
"eval_steps_per_second": 8.932, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 0.5351269841194153, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0335, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7040000000000001, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6567164179104478, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.9079365079365079, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8773006134969326, |
|
"eval_PERSON_recall": 0.9407894736842105, |
|
"eval_QUANTITY_f1": 0.7272727272727272, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8253968253968255, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.1979534924030304, |
|
"eval_overall_accuracy": 0.9603072983354674, |
|
"eval_overall_f1": 0.8391608391608392, |
|
"eval_overall_precision": 0.7957559681697612, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.3372, |
|
"eval_samples_per_second": 554.49, |
|
"eval_steps_per_second": 8.896, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 0.3918878138065338, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.0333, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.688, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6417910447761194, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.889589905362776, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8545454545454545, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7384615384615385, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.1945626586675644, |
|
"eval_overall_accuracy": 0.9580025608194622, |
|
"eval_overall_f1": 0.8222222222222222, |
|
"eval_overall_precision": 0.774869109947644, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.3368, |
|
"eval_samples_per_second": 555.197, |
|
"eval_steps_per_second": 8.907, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 0.9337367415428162, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.0311, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6991869918699186, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6615384615384615, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7878787878787877, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.896551724137931, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.896551724137931, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.19715982675552368, |
|
"eval_overall_accuracy": 0.9605633802816902, |
|
"eval_overall_f1": 0.8470254957507082, |
|
"eval_overall_precision": 0.8125, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.3336, |
|
"eval_samples_per_second": 560.63, |
|
"eval_steps_per_second": 8.994, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 1.763173222541809, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.0314, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7049180327868853, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.671875, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8980891719745223, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8703703703703703, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.2073572725057602, |
|
"eval_overall_accuracy": 0.9572343149807938, |
|
"eval_overall_f1": 0.8342696629213484, |
|
"eval_overall_precision": 0.7941176470588235, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.3343, |
|
"eval_samples_per_second": 559.3, |
|
"eval_steps_per_second": 8.973, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 0.9943879842758179, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0317, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.7301587301587301, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6764705882352942, |
|
"eval_ORGANIZATION_recall": 0.7931034482758621, |
|
"eval_PERSON_f1": 0.9044585987261147, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8765432098765432, |
|
"eval_PERSON_recall": 0.9342105263157895, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7272727272727273, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6486486486486487, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.21239928901195526, |
|
"eval_overall_accuracy": 0.9577464788732394, |
|
"eval_overall_f1": 0.8344923504867873, |
|
"eval_overall_precision": 0.7874015748031497, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.3359, |
|
"eval_samples_per_second": 556.631, |
|
"eval_steps_per_second": 8.93, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 0.39654669165611267, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0297, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.881118881118881, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8513513513513513, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6379310344827587, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6379310344827587, |
|
"eval_ORGANIZATION_recall": 0.6379310344827587, |
|
"eval_PERSON_f1": 0.9009584664536742, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8757763975155279, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7272727272727272, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.2062947303056717, |
|
"eval_overall_accuracy": 0.9567221510883482, |
|
"eval_overall_f1": 0.8233618233618234, |
|
"eval_overall_precision": 0.7939560439560439, |
|
"eval_overall_recall": 0.8550295857988166, |
|
"eval_runtime": 0.3343, |
|
"eval_samples_per_second": 559.346, |
|
"eval_steps_per_second": 8.973, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 0.2321532964706421, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0293, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6825396825396826, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6323529411764706, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.9015873015873016, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8711656441717791, |
|
"eval_PERSON_recall": 0.9342105263157895, |
|
"eval_QUANTITY_f1": 0.8059701492537312, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7297297297297297, |
|
"eval_QUANTITY_recall": 0.9, |
|
"eval_TIME_f1": 0.8387096774193549, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7878787878787878, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.20541173219680786, |
|
"eval_overall_accuracy": 0.9603072983354674, |
|
"eval_overall_f1": 0.8435754189944134, |
|
"eval_overall_precision": 0.798941798941799, |
|
"eval_overall_recall": 0.893491124260355, |
|
"eval_runtime": 0.3355, |
|
"eval_samples_per_second": 557.322, |
|
"eval_steps_per_second": 8.941, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 2.329578399658203, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0303, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6666666666666667, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6176470588235294, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8980891719745223, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8703703703703703, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7619047619047619, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7058823529411765, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.20924483239650726, |
|
"eval_overall_accuracy": 0.9582586427656851, |
|
"eval_overall_f1": 0.8240223463687152, |
|
"eval_overall_precision": 0.7804232804232805, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.3356, |
|
"eval_samples_per_second": 557.229, |
|
"eval_steps_per_second": 8.939, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 0.4096578359603882, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0319, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6829268292682927, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6461538461538462, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.89171974522293, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7384615384615385, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.21165302395820618, |
|
"eval_overall_accuracy": 0.9567221510883482, |
|
"eval_overall_f1": 0.8230337078651686, |
|
"eval_overall_precision": 0.7834224598930482, |
|
"eval_overall_recall": 0.8668639053254438, |
|
"eval_runtime": 0.3352, |
|
"eval_samples_per_second": 557.866, |
|
"eval_steps_per_second": 8.95, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 0.22333945333957672, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0294, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6829268292682927, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6461538461538462, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8974358974358975, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6857142857142857, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.20302210748195648, |
|
"eval_overall_accuracy": 0.9577464788732394, |
|
"eval_overall_f1": 0.8258426966292135, |
|
"eval_overall_precision": 0.786096256684492, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.3339, |
|
"eval_samples_per_second": 560.02, |
|
"eval_steps_per_second": 8.984, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 0.893441915512085, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.0282, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6721311475409836, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.640625, |
|
"eval_ORGANIZATION_recall": 0.7068965517241379, |
|
"eval_PERSON_f1": 0.89171974522293, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.7936507936507937, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7352941176470589, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.20604942739009857, |
|
"eval_overall_accuracy": 0.9585147247119078, |
|
"eval_overall_f1": 0.829817158931083, |
|
"eval_overall_precision": 0.7908847184986595, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.3381, |
|
"eval_samples_per_second": 553.156, |
|
"eval_steps_per_second": 8.874, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 1.8298670053482056, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.0298, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6610169491525424, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.65, |
|
"eval_ORGANIZATION_recall": 0.6724137931034483, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7272727272727272, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7741935483870968, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8275862068965517, |
|
"eval_loss": 0.20402812957763672, |
|
"eval_overall_accuracy": 0.9585147247119078, |
|
"eval_overall_f1": 0.8238636363636365, |
|
"eval_overall_precision": 0.7923497267759563, |
|
"eval_overall_recall": 0.8579881656804734, |
|
"eval_runtime": 0.3363, |
|
"eval_samples_per_second": 556.081, |
|
"eval_steps_per_second": 8.921, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 0.38677918910980225, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0296, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6991869918699186, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6615384615384615, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.9009584664536742, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8757763975155279, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7878787878787877, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8524590163934426, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.1978691667318344, |
|
"eval_overall_accuracy": 0.9608194622279129, |
|
"eval_overall_f1": 0.8474576271186441, |
|
"eval_overall_precision": 0.8108108108108109, |
|
"eval_overall_recall": 0.8875739644970414, |
|
"eval_runtime": 0.3358, |
|
"eval_samples_per_second": 556.894, |
|
"eval_steps_per_second": 8.934, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 0.18261797726154327, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0281, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7107438016528926, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6825396825396826, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8125, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.2115841805934906, |
|
"eval_overall_accuracy": 0.9580025608194622, |
|
"eval_overall_f1": 0.8389830508474576, |
|
"eval_overall_precision": 0.8027027027027027, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.3347, |
|
"eval_samples_per_second": 558.764, |
|
"eval_steps_per_second": 8.964, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 0.5827004909515381, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0285, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6721311475409836, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.640625, |
|
"eval_ORGANIZATION_recall": 0.7068965517241379, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7272727272727272, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7692307692307692, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6944444444444444, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.20784814655780792, |
|
"eval_overall_accuracy": 0.9569782330345711, |
|
"eval_overall_f1": 0.8258426966292135, |
|
"eval_overall_precision": 0.786096256684492, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.3341, |
|
"eval_samples_per_second": 559.746, |
|
"eval_steps_per_second": 8.98, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 0.163285493850708, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0248, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6612903225806452, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6212121212121212, |
|
"eval_ORGANIZATION_recall": 0.7068965517241379, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7352941176470588, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6410256410256411, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.22002604603767395, |
|
"eval_overall_accuracy": 0.9541613316261204, |
|
"eval_overall_f1": 0.8200836820083682, |
|
"eval_overall_precision": 0.7757255936675461, |
|
"eval_overall_recall": 0.8698224852071006, |
|
"eval_runtime": 0.3337, |
|
"eval_samples_per_second": 560.445, |
|
"eval_steps_per_second": 8.991, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 0.5999857783317566, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.026, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.888888888888889, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8533333333333334, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6666666666666667, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6451612903225806, |
|
"eval_ORGANIZATION_recall": 0.6896551724137931, |
|
"eval_PERSON_f1": 0.8974358974358975, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8524590163934426, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.20526228845119476, |
|
"eval_overall_accuracy": 0.9590268886043534, |
|
"eval_overall_f1": 0.8404558404558404, |
|
"eval_overall_precision": 0.8104395604395604, |
|
"eval_overall_recall": 0.8727810650887574, |
|
"eval_runtime": 0.3329, |
|
"eval_samples_per_second": 561.768, |
|
"eval_steps_per_second": 9.012, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 0.8914698362350464, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0267, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6829268292682927, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6461538461538462, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8980891719745223, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8703703703703703, |
|
"eval_PERSON_recall": 0.9276315789473685, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7222222222222222, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.20852600038051605, |
|
"eval_overall_accuracy": 0.9585147247119078, |
|
"eval_overall_f1": 0.8359046283309958, |
|
"eval_overall_precision": 0.7946666666666666, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.3353, |
|
"eval_samples_per_second": 557.656, |
|
"eval_steps_per_second": 8.946, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 0.07933935523033142, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0256, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6774193548387097, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6363636363636364, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.89171974522293, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7878787878787877, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7222222222222222, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.21233612298965454, |
|
"eval_overall_accuracy": 0.9582586427656851, |
|
"eval_overall_f1": 0.8335664335664336, |
|
"eval_overall_precision": 0.7904509283819628, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.3363, |
|
"eval_samples_per_second": 556.087, |
|
"eval_steps_per_second": 8.921, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 1.2923147678375244, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0258, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.7, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6774193548387096, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7692307692307692, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6944444444444444, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.20847661793231964, |
|
"eval_overall_accuracy": 0.9572343149807938, |
|
"eval_overall_f1": 0.8338028169014083, |
|
"eval_overall_precision": 0.7956989247311828, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.3331, |
|
"eval_samples_per_second": 561.331, |
|
"eval_steps_per_second": 9.005, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 0.8602144718170166, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0278, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6984126984126984, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6470588235294118, |
|
"eval_ORGANIZATION_recall": 0.7586206896551724, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.7575757575757576, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6756756756756757, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.2143712192773819, |
|
"eval_overall_accuracy": 0.9582586427656851, |
|
"eval_overall_f1": 0.829608938547486, |
|
"eval_overall_precision": 0.7857142857142857, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.3343, |
|
"eval_samples_per_second": 559.33, |
|
"eval_steps_per_second": 8.973, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 3.9535341262817383, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0266, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.672, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6268656716417911, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7384615384615385, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6857142857142857, |
|
"eval_QUANTITY_recall": 0.8, |
|
"eval_TIME_f1": 0.8253968253968255, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.21172450482845306, |
|
"eval_overall_accuracy": 0.9585147247119078, |
|
"eval_overall_f1": 0.8314606741573034, |
|
"eval_overall_precision": 0.7914438502673797, |
|
"eval_overall_recall": 0.8757396449704142, |
|
"eval_runtime": 0.3355, |
|
"eval_samples_per_second": 557.315, |
|
"eval_steps_per_second": 8.941, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 0.6084784865379333, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0277, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6774193548387097, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6363636363636364, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.89171974522293, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7222222222222222, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.21649378538131714, |
|
"eval_overall_accuracy": 0.9574903969270167, |
|
"eval_overall_f1": 0.8335664335664336, |
|
"eval_overall_precision": 0.7904509283819628, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.3329, |
|
"eval_samples_per_second": 561.77, |
|
"eval_steps_per_second": 9.012, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 3.59494686126709, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0263, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6935483870967741, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6515151515151515, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.7692307692307692, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.6944444444444444, |
|
"eval_TIME_recall": 0.8620689655172413, |
|
"eval_loss": 0.21574969589710236, |
|
"eval_overall_accuracy": 0.9572343149807938, |
|
"eval_overall_f1": 0.8284518828451882, |
|
"eval_overall_precision": 0.783641160949868, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.336, |
|
"eval_samples_per_second": 556.623, |
|
"eval_steps_per_second": 8.93, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 0.6815735697746277, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0249, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.8767123287671235, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8311688311688312, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6666666666666666, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6307692307692307, |
|
"eval_ORGANIZATION_recall": 0.7068965517241379, |
|
"eval_PERSON_f1": 0.89171974522293, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.8, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7428571428571429, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8125, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.21547271311283112, |
|
"eval_overall_accuracy": 0.9574903969270167, |
|
"eval_overall_f1": 0.8342696629213484, |
|
"eval_overall_precision": 0.7941176470588235, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.3337, |
|
"eval_samples_per_second": 560.443, |
|
"eval_steps_per_second": 8.991, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 0.9203242063522339, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.026, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.8689655172413793, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8289473684210527, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.688, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6417910447761194, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7575757575757577, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6944444444444444, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8253968253968255, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.21566654741764069, |
|
"eval_overall_accuracy": 0.9580025608194622, |
|
"eval_overall_f1": 0.8342696629213484, |
|
"eval_overall_precision": 0.7941176470588235, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.3342, |
|
"eval_samples_per_second": 559.523, |
|
"eval_steps_per_second": 8.976, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 1.3422565460205078, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.0246, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6935483870967741, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6515151515151515, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.746268656716418, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8125, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.21777355670928955, |
|
"eval_overall_accuracy": 0.9574903969270167, |
|
"eval_overall_f1": 0.8319327731092437, |
|
"eval_overall_precision": 0.7898936170212766, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.3325, |
|
"eval_samples_per_second": 562.463, |
|
"eval_steps_per_second": 9.023, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 0.5304462909698486, |
|
"learning_rate": 3e-06, |
|
"loss": 0.0228, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6666666666666667, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6056338028169014, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7878787878787877, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8125, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.21389849483966827, |
|
"eval_overall_accuracy": 0.9577464788732394, |
|
"eval_overall_f1": 0.83008356545961, |
|
"eval_overall_precision": 0.7842105263157895, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.3334, |
|
"eval_samples_per_second": 560.952, |
|
"eval_steps_per_second": 8.999, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 0.9430941343307495, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0239, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.863013698630137, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8181818181818182, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.688, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6417910447761194, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7878787878787877, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8253968253968255, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.2171957641839981, |
|
"eval_overall_accuracy": 0.9580025608194622, |
|
"eval_overall_f1": 0.8359046283309958, |
|
"eval_overall_precision": 0.7946666666666666, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.3342, |
|
"eval_samples_per_second": 559.517, |
|
"eval_steps_per_second": 8.976, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 0.5671630501747131, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0246, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.882758620689655, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8421052631578947, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6771653543307088, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6231884057971014, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7761194029850748, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8125, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.21604588627815247, |
|
"eval_overall_accuracy": 0.9585147247119078, |
|
"eval_overall_f1": 0.835195530726257, |
|
"eval_overall_precision": 0.791005291005291, |
|
"eval_overall_recall": 0.8846153846153846, |
|
"eval_runtime": 0.3336, |
|
"eval_samples_per_second": 560.484, |
|
"eval_steps_per_second": 8.992, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 2.1864192485809326, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.0263, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.888888888888889, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.8533333333333334, |
|
"eval_LOCATION_recall": 0.927536231884058, |
|
"eval_ORGANIZATION_f1": 0.6829268292682927, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6461538461538462, |
|
"eval_ORGANIZATION_recall": 0.7241379310344828, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7692307692307692, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7142857142857143, |
|
"eval_QUANTITY_recall": 0.8333333333333334, |
|
"eval_TIME_f1": 0.8253968253968255, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.2144096940755844, |
|
"eval_overall_accuracy": 0.9585147247119078, |
|
"eval_overall_f1": 0.8389830508474576, |
|
"eval_overall_precision": 0.8027027027027027, |
|
"eval_overall_recall": 0.878698224852071, |
|
"eval_runtime": 0.3344, |
|
"eval_samples_per_second": 559.208, |
|
"eval_steps_per_second": 8.971, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 0.35259944200515747, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0243, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.8749999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.84, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.688, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6417910447761194, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7878787878787877, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8125, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.21475861966609955, |
|
"eval_overall_accuracy": 0.9582586427656851, |
|
"eval_overall_f1": 0.8370786516853933, |
|
"eval_overall_precision": 0.7967914438502673, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.3334, |
|
"eval_samples_per_second": 560.934, |
|
"eval_steps_per_second": 8.999, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 1.3611903190612793, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.0232, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.8749999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.84, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6935483870967741, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6515151515151515, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7878787878787877, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8125, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.2144315391778946, |
|
"eval_overall_accuracy": 0.9580025608194622, |
|
"eval_overall_f1": 0.8382559774964837, |
|
"eval_overall_precision": 0.7989276139410187, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.334, |
|
"eval_samples_per_second": 559.885, |
|
"eval_steps_per_second": 8.982, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 0.2549450397491455, |
|
"learning_rate": 0.0, |
|
"loss": 0.0224, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.8749999999999999, |
|
"eval_LOCATION_number": 69, |
|
"eval_LOCATION_precision": 0.84, |
|
"eval_LOCATION_recall": 0.9130434782608695, |
|
"eval_ORGANIZATION_f1": 0.6935483870967741, |
|
"eval_ORGANIZATION_number": 58, |
|
"eval_ORGANIZATION_precision": 0.6515151515151515, |
|
"eval_ORGANIZATION_recall": 0.7413793103448276, |
|
"eval_PERSON_f1": 0.8945686900958467, |
|
"eval_PERSON_number": 152, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9210526315789473, |
|
"eval_QUANTITY_f1": 0.7878787878787877, |
|
"eval_QUANTITY_number": 30, |
|
"eval_QUANTITY_precision": 0.7222222222222222, |
|
"eval_QUANTITY_recall": 0.8666666666666667, |
|
"eval_TIME_f1": 0.8125, |
|
"eval_TIME_number": 29, |
|
"eval_TIME_precision": 0.7428571428571429, |
|
"eval_TIME_recall": 0.896551724137931, |
|
"eval_loss": 0.21471820771694183, |
|
"eval_overall_accuracy": 0.9580025608194622, |
|
"eval_overall_f1": 0.8382559774964837, |
|
"eval_overall_precision": 0.7989276139410187, |
|
"eval_overall_recall": 0.8816568047337278, |
|
"eval_runtime": 0.336, |
|
"eval_samples_per_second": 556.48, |
|
"eval_steps_per_second": 8.927, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 10600, |
|
"total_flos": 5008141811675874.0, |
|
"train_loss": 0.0706503679617396, |
|
"train_runtime": 608.9849, |
|
"train_samples_per_second": 277.018, |
|
"train_steps_per_second": 17.406 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 10600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 5008141811675874.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|