|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 10600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 1.4652527570724487, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 1.2491, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.0, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.0, |
|
"eval_PERSON_recall": 0.0, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.7288655042648315, |
|
"eval_overall_accuracy": 0.8365739601279842, |
|
"eval_overall_f1": 0.0, |
|
"eval_overall_precision": 0.0, |
|
"eval_overall_recall": 0.0, |
|
"eval_runtime": 0.9333, |
|
"eval_samples_per_second": 200.373, |
|
"eval_steps_per_second": 3.215, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 1.179681658744812, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.7042, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.012820512820512822, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.16666666666666666, |
|
"eval_PERSON_recall": 0.006666666666666667, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.6214632391929626, |
|
"eval_overall_accuracy": 0.8375584543440807, |
|
"eval_overall_f1": 0.005586592178770949, |
|
"eval_overall_precision": 0.14285714285714285, |
|
"eval_overall_recall": 0.002849002849002849, |
|
"eval_runtime": 0.9735, |
|
"eval_samples_per_second": 192.098, |
|
"eval_steps_per_second": 3.082, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 1.2983235120773315, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.6157, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.02631578947368421, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.3333333333333333, |
|
"eval_LOCATION_recall": 0.0136986301369863, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.058823529411764705, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.25, |
|
"eval_PERSON_recall": 0.03333333333333333, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.532402515411377, |
|
"eval_overall_accuracy": 0.8437115431946838, |
|
"eval_overall_f1": 0.03108808290155441, |
|
"eval_overall_precision": 0.17142857142857143, |
|
"eval_overall_recall": 0.017094017094017096, |
|
"eval_runtime": 1.0085, |
|
"eval_samples_per_second": 185.432, |
|
"eval_steps_per_second": 2.975, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 1.2393027544021606, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.5215, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.16666666666666663, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6363636363636364, |
|
"eval_LOCATION_recall": 0.0958904109589041, |
|
"eval_ORGANIZATION_f1": 0.025, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.06666666666666667, |
|
"eval_ORGANIZATION_recall": 0.015384615384615385, |
|
"eval_PERSON_f1": 0.3102040816326531, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.4, |
|
"eval_PERSON_recall": 0.25333333333333335, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.2692307692307692, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.3888888888888889, |
|
"eval_TIME_recall": 0.20588235294117646, |
|
"eval_loss": 0.4347396790981293, |
|
"eval_overall_accuracy": 0.8707851341373369, |
|
"eval_overall_f1": 0.2163265306122449, |
|
"eval_overall_precision": 0.381294964028777, |
|
"eval_overall_recall": 0.150997150997151, |
|
"eval_runtime": 0.9853, |
|
"eval_samples_per_second": 189.782, |
|
"eval_steps_per_second": 3.045, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 1.3171206712722778, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.4311, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.38260869565217387, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.5238095238095238, |
|
"eval_LOCATION_recall": 0.3013698630136986, |
|
"eval_ORGANIZATION_f1": 0.17021276595744683, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.27586206896551724, |
|
"eval_ORGANIZATION_recall": 0.12307692307692308, |
|
"eval_PERSON_f1": 0.6098360655737705, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.6, |
|
"eval_PERSON_recall": 0.62, |
|
"eval_QUANTITY_f1": 0.05405405405405405, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.125, |
|
"eval_QUANTITY_recall": 0.034482758620689655, |
|
"eval_TIME_f1": 0.6268656716417911, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6363636363636364, |
|
"eval_TIME_recall": 0.6176470588235294, |
|
"eval_loss": 0.35183095932006836, |
|
"eval_overall_accuracy": 0.9047501845926655, |
|
"eval_overall_f1": 0.46925566343042074, |
|
"eval_overall_precision": 0.5430711610486891, |
|
"eval_overall_recall": 0.4131054131054131, |
|
"eval_runtime": 0.951, |
|
"eval_samples_per_second": 196.64, |
|
"eval_steps_per_second": 3.155, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 1.2733343839645386, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.3468, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.5165562913907286, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.5, |
|
"eval_LOCATION_recall": 0.5342465753424658, |
|
"eval_ORGANIZATION_f1": 0.39062500000000006, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.3968253968253968, |
|
"eval_ORGANIZATION_recall": 0.38461538461538464, |
|
"eval_PERSON_f1": 0.7823529411764706, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7, |
|
"eval_PERSON_recall": 0.8866666666666667, |
|
"eval_QUANTITY_f1": 0.39999999999999997, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.3870967741935484, |
|
"eval_QUANTITY_recall": 0.41379310344827586, |
|
"eval_TIME_f1": 0.6756756756756757, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.625, |
|
"eval_TIME_recall": 0.7352941176470589, |
|
"eval_loss": 0.29307425022125244, |
|
"eval_overall_accuracy": 0.9237016982525228, |
|
"eval_overall_f1": 0.6215139442231076, |
|
"eval_overall_precision": 0.582089552238806, |
|
"eval_overall_recall": 0.6666666666666666, |
|
"eval_runtime": 0.9368, |
|
"eval_samples_per_second": 199.617, |
|
"eval_steps_per_second": 3.202, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 1.3349977731704712, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.2867, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.6296296296296295, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.5730337078651685, |
|
"eval_LOCATION_recall": 0.6986301369863014, |
|
"eval_ORGANIZATION_f1": 0.4444444444444445, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.4050632911392405, |
|
"eval_ORGANIZATION_recall": 0.49230769230769234, |
|
"eval_PERSON_f1": 0.8179104477611939, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7405405405405405, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.43076923076923074, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.3888888888888889, |
|
"eval_QUANTITY_recall": 0.4827586206896552, |
|
"eval_TIME_f1": 0.7027027027027027, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.65, |
|
"eval_TIME_recall": 0.7647058823529411, |
|
"eval_loss": 0.246965229511261, |
|
"eval_overall_accuracy": 0.9328082697514152, |
|
"eval_overall_f1": 0.6666666666666666, |
|
"eval_overall_precision": 0.6060606060606061, |
|
"eval_overall_recall": 0.7407407407407407, |
|
"eval_runtime": 0.9397, |
|
"eval_samples_per_second": 199.001, |
|
"eval_steps_per_second": 3.193, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 1.5047358274459839, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.2534, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.6380368098159509, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.5777777777777777, |
|
"eval_LOCATION_recall": 0.7123287671232876, |
|
"eval_ORGANIZATION_f1": 0.5070422535211268, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.4675324675324675, |
|
"eval_ORGANIZATION_recall": 0.5538461538461539, |
|
"eval_PERSON_f1": 0.8267477203647415, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7597765363128491, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.4444444444444445, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.4117647058823529, |
|
"eval_QUANTITY_recall": 0.4827586206896552, |
|
"eval_TIME_f1": 0.6933333333333332, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6341463414634146, |
|
"eval_TIME_recall": 0.7647058823529411, |
|
"eval_loss": 0.21960192918777466, |
|
"eval_overall_accuracy": 0.9355156288456805, |
|
"eval_overall_f1": 0.683937823834197, |
|
"eval_overall_precision": 0.6270783847980997, |
|
"eval_overall_recall": 0.7521367521367521, |
|
"eval_runtime": 0.9508, |
|
"eval_samples_per_second": 196.67, |
|
"eval_steps_per_second": 3.155, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 2.822505474090576, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.225, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.7239263803680981, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6555555555555556, |
|
"eval_LOCATION_recall": 0.8082191780821918, |
|
"eval_ORGANIZATION_f1": 0.5466666666666666, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.4823529411764706, |
|
"eval_ORGANIZATION_recall": 0.6307692307692307, |
|
"eval_PERSON_f1": 0.8379204892966361, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7740112994350282, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.4444444444444445, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.4117647058823529, |
|
"eval_QUANTITY_recall": 0.4827586206896552, |
|
"eval_TIME_f1": 0.7297297297297296, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.675, |
|
"eval_TIME_recall": 0.7941176470588235, |
|
"eval_loss": 0.19911912083625793, |
|
"eval_overall_accuracy": 0.9404380999261629, |
|
"eval_overall_f1": 0.7155727155727156, |
|
"eval_overall_precision": 0.6525821596244131, |
|
"eval_overall_recall": 0.792022792022792, |
|
"eval_runtime": 0.9711, |
|
"eval_samples_per_second": 192.571, |
|
"eval_steps_per_second": 3.089, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 0.7733340859413147, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.2073, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.7361963190184049, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6666666666666666, |
|
"eval_LOCATION_recall": 0.821917808219178, |
|
"eval_ORGANIZATION_f1": 0.5771812080536913, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5119047619047619, |
|
"eval_ORGANIZATION_recall": 0.6615384615384615, |
|
"eval_PERSON_f1": 0.834355828220859, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7727272727272727, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.4838709677419355, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.45454545454545453, |
|
"eval_QUANTITY_recall": 0.5172413793103449, |
|
"eval_TIME_f1": 0.7837837837837837, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.725, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.18784372508525848, |
|
"eval_overall_accuracy": 0.9421609648043318, |
|
"eval_overall_f1": 0.7312661498708009, |
|
"eval_overall_precision": 0.6690307328605201, |
|
"eval_overall_recall": 0.8062678062678063, |
|
"eval_runtime": 0.975, |
|
"eval_samples_per_second": 191.794, |
|
"eval_steps_per_second": 3.077, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 1.2668209075927734, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.1928, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.738095238095238, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6526315789473685, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.588235294117647, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5113636363636364, |
|
"eval_ORGANIZATION_recall": 0.6923076923076923, |
|
"eval_PERSON_f1": 0.8353658536585366, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7696629213483146, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.5074626865671642, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.4473684210526316, |
|
"eval_QUANTITY_recall": 0.5862068965517241, |
|
"eval_TIME_f1": 0.7631578947368423, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6904761904761905, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.17933246493339539, |
|
"eval_overall_accuracy": 0.94265321191238, |
|
"eval_overall_f1": 0.7323232323232324, |
|
"eval_overall_precision": 0.6575963718820862, |
|
"eval_overall_recall": 0.8262108262108262, |
|
"eval_runtime": 0.9501, |
|
"eval_samples_per_second": 196.821, |
|
"eval_steps_per_second": 3.158, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 1.7145781517028809, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.1834, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.738095238095238, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6526315789473685, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6114649681528661, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5217391304347826, |
|
"eval_ORGANIZATION_recall": 0.7384615384615385, |
|
"eval_PERSON_f1": 0.8369230769230769, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7771428571428571, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.5373134328358208, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.47368421052631576, |
|
"eval_QUANTITY_recall": 0.6206896551724138, |
|
"eval_TIME_f1": 0.7894736842105262, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.17776605486869812, |
|
"eval_overall_accuracy": 0.9428993354664041, |
|
"eval_overall_f1": 0.7414880201765448, |
|
"eval_overall_precision": 0.665158371040724, |
|
"eval_overall_recall": 0.8376068376068376, |
|
"eval_runtime": 0.9578, |
|
"eval_samples_per_second": 195.239, |
|
"eval_steps_per_second": 3.132, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 0.8720563054084778, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.172, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.7469879518072289, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6666666666666666, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6143790849673202, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5340909090909091, |
|
"eval_ORGANIZATION_recall": 0.7230769230769231, |
|
"eval_PERSON_f1": 0.8421052631578947, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7861271676300579, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.5588235294117647, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.48717948717948717, |
|
"eval_QUANTITY_recall": 0.6551724137931034, |
|
"eval_TIME_f1": 0.7894736842105262, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.1679297238588333, |
|
"eval_overall_accuracy": 0.9458528181146936, |
|
"eval_overall_f1": 0.7480916030534351, |
|
"eval_overall_precision": 0.6758620689655173, |
|
"eval_overall_recall": 0.8376068376068376, |
|
"eval_runtime": 0.9625, |
|
"eval_samples_per_second": 194.292, |
|
"eval_steps_per_second": 3.117, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 1.491217851638794, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.171, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.7654320987654321, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6966292134831461, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6496815286624205, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5543478260869565, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8411214953271027, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7894736842105263, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.5588235294117647, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.48717948717948717, |
|
"eval_QUANTITY_recall": 0.6551724137931034, |
|
"eval_TIME_f1": 0.7792207792207793, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6976744186046512, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.16589853167533875, |
|
"eval_overall_accuracy": 0.9456066945606695, |
|
"eval_overall_f1": 0.756687898089172, |
|
"eval_overall_precision": 0.684331797235023, |
|
"eval_overall_recall": 0.8461538461538461, |
|
"eval_runtime": 0.9481, |
|
"eval_samples_per_second": 197.228, |
|
"eval_steps_per_second": 3.164, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 1.3357112407684326, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.1631, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.7411764705882353, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6494845360824743, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6274509803921569, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5454545454545454, |
|
"eval_ORGANIZATION_recall": 0.7384615384615385, |
|
"eval_PERSON_f1": 0.8509316770186336, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7965116279069767, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6268656716417911, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5526315789473685, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.7792207792207793, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6976744186046512, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.16929781436920166, |
|
"eval_overall_accuracy": 0.9451144474526212, |
|
"eval_overall_f1": 0.7579214195183777, |
|
"eval_overall_precision": 0.682648401826484, |
|
"eval_overall_recall": 0.8518518518518519, |
|
"eval_runtime": 0.955, |
|
"eval_samples_per_second": 195.82, |
|
"eval_steps_per_second": 3.141, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 1.694993257522583, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.1579, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.75, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.6631578947368421, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6233766233766234, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5393258426966292, |
|
"eval_ORGANIZATION_recall": 0.7384615384615385, |
|
"eval_PERSON_f1": 0.8553459119496856, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8095238095238095, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.6086956521739131, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.525, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.7692307692307693, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6818181818181818, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.16372992098331451, |
|
"eval_overall_accuracy": 0.9475756829928624, |
|
"eval_overall_f1": 0.7573062261753494, |
|
"eval_overall_precision": 0.6834862385321101, |
|
"eval_overall_recall": 0.8490028490028491, |
|
"eval_runtime": 1.042, |
|
"eval_samples_per_second": 179.466, |
|
"eval_steps_per_second": 2.879, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 2.6867129802703857, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.1558, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.7730061349693251, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6289308176100629, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5319148936170213, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8500000000000001, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.5797101449275363, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5, |
|
"eval_QUANTITY_recall": 0.6896551724137931, |
|
"eval_TIME_f1": 0.7792207792207793, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6976744186046512, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.15953023731708527, |
|
"eval_overall_accuracy": 0.9485601772089589, |
|
"eval_overall_f1": 0.7588832487309645, |
|
"eval_overall_precision": 0.6842105263157895, |
|
"eval_overall_recall": 0.8518518518518519, |
|
"eval_runtime": 0.9584, |
|
"eval_samples_per_second": 195.113, |
|
"eval_steps_per_second": 3.13, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 1.2975411415100098, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.15, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.7901234567901235, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7191011235955056, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6666666666666667, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5882352941176471, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8544303797468354, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8132530120481928, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.6060606060606061, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5405405405405406, |
|
"eval_QUANTITY_recall": 0.6896551724137931, |
|
"eval_TIME_f1": 0.7894736842105262, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.1525745838880539, |
|
"eval_overall_accuracy": 0.950775289195176, |
|
"eval_overall_f1": 0.7766233766233767, |
|
"eval_overall_precision": 0.7136038186157518, |
|
"eval_overall_recall": 0.8518518518518519, |
|
"eval_runtime": 0.9603, |
|
"eval_samples_per_second": 194.722, |
|
"eval_steps_per_second": 3.124, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 0.9000276923179626, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.1469, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.7901234567901235, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7191011235955056, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.638036809815951, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5306122448979592, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8544303797468354, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8132530120481928, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.7894736842105262, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.15378721058368683, |
|
"eval_overall_accuracy": 0.9502830420871278, |
|
"eval_overall_f1": 0.7739463601532567, |
|
"eval_overall_precision": 0.7013888888888888, |
|
"eval_overall_recall": 0.8632478632478633, |
|
"eval_runtime": 0.9594, |
|
"eval_samples_per_second": 194.917, |
|
"eval_steps_per_second": 3.127, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 1.5783941745758057, |
|
"learning_rate": 4e-05, |
|
"loss": 0.1429, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.7875, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6621621621621622, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5903614457831325, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8544303797468354, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8132530120481928, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.6268656716417911, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5526315789473685, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.1472158133983612, |
|
"eval_overall_accuracy": 0.9524981540733448, |
|
"eval_overall_f1": 0.7780678851174936, |
|
"eval_overall_precision": 0.7180722891566265, |
|
"eval_overall_recall": 0.8490028490028491, |
|
"eval_runtime": 0.9598, |
|
"eval_samples_per_second": 194.837, |
|
"eval_steps_per_second": 3.126, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 2.0488758087158203, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.1419, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.7875, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6666666666666667, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5882352941176471, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8598726114649682, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.823170731707317, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.6567164179104478, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5789473684210527, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.7692307692307693, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6818181818181818, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14743593335151672, |
|
"eval_overall_accuracy": 0.9524981540733448, |
|
"eval_overall_f1": 0.7802340702210663, |
|
"eval_overall_precision": 0.7177033492822966, |
|
"eval_overall_recall": 0.8547008547008547, |
|
"eval_runtime": 0.9574, |
|
"eval_samples_per_second": 195.324, |
|
"eval_steps_per_second": 3.134, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 1.5187019109725952, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.1365, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.7926829268292682, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7142857142857143, |
|
"eval_LOCATION_recall": 0.8904109589041096, |
|
"eval_ORGANIZATION_f1": 0.6455696202531646, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5483870967741935, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8860759493670886, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8433734939759037, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.6865671641791046, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6052631578947368, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.7594936708860759, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.15414337813854218, |
|
"eval_overall_accuracy": 0.9517597834112724, |
|
"eval_overall_f1": 0.788265306122449, |
|
"eval_overall_precision": 0.7136258660508084, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.9544, |
|
"eval_samples_per_second": 195.93, |
|
"eval_steps_per_second": 3.143, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 2.007498025894165, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.1356, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.7950310559006212, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7272727272727273, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6493506493506495, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5617977528089888, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8634920634920634, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8242424242424242, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1455027163028717, |
|
"eval_overall_accuracy": 0.9534826482894413, |
|
"eval_overall_f1": 0.7859922178988327, |
|
"eval_overall_precision": 0.7214285714285714, |
|
"eval_overall_recall": 0.8632478632478633, |
|
"eval_runtime": 0.9568, |
|
"eval_samples_per_second": 195.44, |
|
"eval_steps_per_second": 3.135, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 1.5448315143585205, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.1326, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.7878787878787878, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7065217391304348, |
|
"eval_LOCATION_recall": 0.8904109589041096, |
|
"eval_ORGANIZATION_f1": 0.6496815286624205, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5543478260869565, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8761904761904761, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8363636363636363, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.676470588235294, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5897435897435898, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.7692307692307693, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6818181818181818, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.15045028924942017, |
|
"eval_overall_accuracy": 0.9522520305193207, |
|
"eval_overall_f1": 0.7841634738186462, |
|
"eval_overall_precision": 0.7106481481481481, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.9528, |
|
"eval_samples_per_second": 196.256, |
|
"eval_steps_per_second": 3.148, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 1.4791549444198608, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.13, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.7926829268292682, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7142857142857143, |
|
"eval_LOCATION_recall": 0.8904109589041096, |
|
"eval_ORGANIZATION_f1": 0.6490066225165563, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5697674418604651, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.676470588235294, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5897435897435898, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.7692307692307693, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6818181818181818, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.1473151594400406, |
|
"eval_overall_accuracy": 0.9529904011813931, |
|
"eval_overall_f1": 0.7870967741935483, |
|
"eval_overall_precision": 0.7193396226415094, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.9439, |
|
"eval_samples_per_second": 198.109, |
|
"eval_steps_per_second": 3.178, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 1.8120989799499512, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.1321, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6619718309859155, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6103896103896104, |
|
"eval_ORGANIZATION_recall": 0.7230769230769231, |
|
"eval_PERSON_f1": 0.8753993610223643, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14089035987854004, |
|
"eval_overall_accuracy": 0.9552055131676102, |
|
"eval_overall_f1": 0.7941567065073041, |
|
"eval_overall_precision": 0.7437810945273632, |
|
"eval_overall_recall": 0.8518518518518519, |
|
"eval_runtime": 0.9518, |
|
"eval_samples_per_second": 196.471, |
|
"eval_steps_per_second": 3.152, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 0.6371389031410217, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.1272, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6438356164383562, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5802469135802469, |
|
"eval_ORGANIZATION_recall": 0.7230769230769231, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6865671641791046, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6052631578947368, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.7692307692307693, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6818181818181818, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14270104467868805, |
|
"eval_overall_accuracy": 0.9547132660595619, |
|
"eval_overall_f1": 0.7916120576671035, |
|
"eval_overall_precision": 0.7330097087378641, |
|
"eval_overall_recall": 0.8603988603988604, |
|
"eval_runtime": 0.9626, |
|
"eval_samples_per_second": 194.265, |
|
"eval_steps_per_second": 3.117, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 1.3416866064071655, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.1278, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.7875, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6530612244897959, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5853658536585366, |
|
"eval_ORGANIZATION_recall": 0.7384615384615385, |
|
"eval_PERSON_f1": 0.888178913738019, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.852760736196319, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6268656716417911, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5526315789473685, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.7792207792207793, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6976744186046512, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14526282250881195, |
|
"eval_overall_accuracy": 0.9527442776273689, |
|
"eval_overall_f1": 0.787958115183246, |
|
"eval_overall_precision": 0.7288135593220338, |
|
"eval_overall_recall": 0.8575498575498576, |
|
"eval_runtime": 1.0218, |
|
"eval_samples_per_second": 183.002, |
|
"eval_steps_per_second": 2.936, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 1.6158010959625244, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.1242, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.779874213836478, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7209302325581395, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6666666666666667, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5795454545454546, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6176470588235294, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5384615384615384, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.7792207792207793, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6976744186046512, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14530108869075775, |
|
"eval_overall_accuracy": 0.9539748953974896, |
|
"eval_overall_f1": 0.7844155844155845, |
|
"eval_overall_precision": 0.720763723150358, |
|
"eval_overall_recall": 0.8603988603988604, |
|
"eval_runtime": 0.9579, |
|
"eval_samples_per_second": 195.225, |
|
"eval_steps_per_second": 3.132, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 1.2722007036209106, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.1208, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.802547770700637, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6713286713286714, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6153846153846154, |
|
"eval_ORGANIZATION_recall": 0.7384615384615385, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6363636363636365, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5675675675675675, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.8108108108108107, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.13934831321239471, |
|
"eval_overall_accuracy": 0.9561900073837066, |
|
"eval_overall_f1": 0.7952127659574469, |
|
"eval_overall_precision": 0.7456359102244389, |
|
"eval_overall_recall": 0.8518518518518519, |
|
"eval_runtime": 0.9579, |
|
"eval_samples_per_second": 195.229, |
|
"eval_steps_per_second": 3.132, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.45983773469924927, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.1213, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.8050314465408805, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7441860465116279, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6455696202531646, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5483870967741935, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8745980707395499, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.84472049689441, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.6470588235294118, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5641025641025641, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.7435897435897436, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6590909090909091, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14607404172420502, |
|
"eval_overall_accuracy": 0.9532365247354172, |
|
"eval_overall_f1": 0.7803617571059431, |
|
"eval_overall_precision": 0.7139479905437353, |
|
"eval_overall_recall": 0.8603988603988604, |
|
"eval_runtime": 0.9648, |
|
"eval_samples_per_second": 193.817, |
|
"eval_steps_per_second": 3.109, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 0.30338501930236816, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.1181, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.8050314465408805, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7441860465116279, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6623376623376623, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5730337078651685, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6268656716417911, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5526315789473685, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.7837837837837837, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.725, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14169462025165558, |
|
"eval_overall_accuracy": 0.9556977602756583, |
|
"eval_overall_f1": 0.7911227154046997, |
|
"eval_overall_precision": 0.7301204819277108, |
|
"eval_overall_recall": 0.8632478632478633, |
|
"eval_runtime": 0.9599, |
|
"eval_samples_per_second": 194.803, |
|
"eval_steps_per_second": 3.125, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 1.1467270851135254, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.1191, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.8101265822784809, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7529411764705882, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6493506493506495, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5617977528089888, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6567164179104478, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5789473684210527, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.7631578947368423, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6904761904761905, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1409684270620346, |
|
"eval_overall_accuracy": 0.9554516367216342, |
|
"eval_overall_f1": 0.788036410923277, |
|
"eval_overall_precision": 0.7248803827751196, |
|
"eval_overall_recall": 0.8632478632478633, |
|
"eval_runtime": 1.0374, |
|
"eval_samples_per_second": 180.261, |
|
"eval_steps_per_second": 2.892, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 1.4821702241897583, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.1156, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.735632183908046, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6577181208053692, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5833333333333334, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6470588235294118, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5641025641025641, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.7733333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7073170731707317, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14082583785057068, |
|
"eval_overall_accuracy": 0.9556977602756583, |
|
"eval_overall_f1": 0.7905759162303665, |
|
"eval_overall_precision": 0.7312348668280871, |
|
"eval_overall_recall": 0.8603988603988604, |
|
"eval_runtime": 0.9851, |
|
"eval_samples_per_second": 189.819, |
|
"eval_steps_per_second": 3.045, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 1.1249200105667114, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.1159, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.735632183908046, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6622516556291391, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5813953488372093, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6470588235294118, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5641025641025641, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.7532467532467532, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6744186046511628, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14301134645938873, |
|
"eval_overall_accuracy": 0.9542210189515137, |
|
"eval_overall_f1": 0.7896103896103895, |
|
"eval_overall_precision": 0.7255369928400954, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.961, |
|
"eval_samples_per_second": 194.591, |
|
"eval_steps_per_second": 3.122, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 0.991729736328125, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.1133, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.802547770700637, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6577181208053692, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5833333333333334, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.7894736842105262, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.13775944709777832, |
|
"eval_overall_accuracy": 0.9559438838296825, |
|
"eval_overall_f1": 0.7921052631578948, |
|
"eval_overall_precision": 0.7359413202933985, |
|
"eval_overall_recall": 0.8575498575498576, |
|
"eval_runtime": 0.9576, |
|
"eval_samples_per_second": 195.271, |
|
"eval_steps_per_second": 3.133, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 0.8443315625190735, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.1141, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.7875, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6582278481012658, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5591397849462365, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8484848484848485, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.6376811594202898, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.55, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.7435897435897436, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6590909090909091, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1476057767868042, |
|
"eval_overall_accuracy": 0.9529904011813931, |
|
"eval_overall_f1": 0.7846153846153847, |
|
"eval_overall_precision": 0.7132867132867133, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.9555, |
|
"eval_samples_per_second": 195.718, |
|
"eval_steps_per_second": 3.14, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 0.8820420503616333, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.1131, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6619718309859155, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6103896103896104, |
|
"eval_ORGANIZATION_recall": 0.7230769230769231, |
|
"eval_PERSON_f1": 0.8917197452229298, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8536585365853658, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8108108108108107, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.13637974858283997, |
|
"eval_overall_accuracy": 0.9571745015998031, |
|
"eval_overall_f1": 0.8031914893617021, |
|
"eval_overall_precision": 0.7531172069825436, |
|
"eval_overall_recall": 0.8603988603988604, |
|
"eval_runtime": 0.9776, |
|
"eval_samples_per_second": 191.287, |
|
"eval_steps_per_second": 3.069, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 7.688674449920654, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.1107, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.7950310559006212, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7272727272727273, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6624203821656051, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5652173913043478, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8484848484848485, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.6470588235294118, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5641025641025641, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.7532467532467532, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.6744186046511628, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.14455579221248627, |
|
"eval_overall_accuracy": 0.9542210189515137, |
|
"eval_overall_f1": 0.7892030848329049, |
|
"eval_overall_precision": 0.7189695550351288, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.9611, |
|
"eval_samples_per_second": 194.572, |
|
"eval_steps_per_second": 3.121, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 0.7613418698310852, |
|
"learning_rate": 3e-05, |
|
"loss": 0.1096, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.7875, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6666666666666667, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5795454545454546, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.7733333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7073170731707317, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.1409280002117157, |
|
"eval_overall_accuracy": 0.9554516367216342, |
|
"eval_overall_f1": 0.7958115183246073, |
|
"eval_overall_precision": 0.7360774818401937, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.953, |
|
"eval_samples_per_second": 196.217, |
|
"eval_steps_per_second": 3.148, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 0.5511670112609863, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.1076, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6799999999999999, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8945686900958466, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.7733333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7073170731707317, |
|
"eval_TIME_recall": 0.8529411764705882, |
|
"eval_loss": 0.13955771923065186, |
|
"eval_overall_accuracy": 0.956928378045779, |
|
"eval_overall_f1": 0.8015768725361366, |
|
"eval_overall_precision": 0.7439024390243902, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.9543, |
|
"eval_samples_per_second": 195.951, |
|
"eval_steps_per_second": 3.144, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 0.7491174340248108, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.1074, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.675496688741722, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5930232558139535, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6376811594202898, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.55, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14121000468730927, |
|
"eval_overall_accuracy": 0.9561900073837066, |
|
"eval_overall_f1": 0.7953063885267275, |
|
"eval_overall_precision": 0.7331730769230769, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.9549, |
|
"eval_samples_per_second": 195.829, |
|
"eval_steps_per_second": 3.142, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 3.582904100418091, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.1068, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6714285714285715, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6266666666666667, |
|
"eval_ORGANIZATION_recall": 0.7230769230769231, |
|
"eval_PERSON_f1": 0.8825396825396825, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1361449509859085, |
|
"eval_overall_accuracy": 0.9584051193699237, |
|
"eval_overall_f1": 0.802124833997344, |
|
"eval_overall_precision": 0.7512437810945274, |
|
"eval_overall_recall": 0.8603988603988604, |
|
"eval_runtime": 0.9551, |
|
"eval_samples_per_second": 195.788, |
|
"eval_steps_per_second": 3.141, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 2.657741069793701, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.1067, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.7999999999999999, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6853146853146853, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6282051282051282, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.879746835443038, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8373493975903614, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8493150684931507, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7948717948717948, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13337016105651855, |
|
"eval_overall_accuracy": 0.9584051193699237, |
|
"eval_overall_f1": 0.8047808764940239, |
|
"eval_overall_precision": 0.753731343283582, |
|
"eval_overall_recall": 0.8632478632478633, |
|
"eval_runtime": 0.9555, |
|
"eval_samples_per_second": 195.712, |
|
"eval_steps_per_second": 3.14, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 3.083543300628662, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.1053, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6799999999999999, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8917197452229298, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8536585365853658, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1369679719209671, |
|
"eval_overall_accuracy": 0.9579128722618755, |
|
"eval_overall_f1": 0.8068331143232589, |
|
"eval_overall_precision": 0.748780487804878, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.9521, |
|
"eval_samples_per_second": 196.405, |
|
"eval_steps_per_second": 3.151, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 1.343135952949524, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.1028, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.8129032258064516, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7682926829268293, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6802721088435374, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6097560975609756, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8945686900958466, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8493150684931507, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7948717948717948, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13157421350479126, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.8154050464807436, |
|
"eval_overall_precision": 0.763681592039801, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.9587, |
|
"eval_samples_per_second": 195.059, |
|
"eval_steps_per_second": 3.129, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 2.0871903896331787, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.1061, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6666666666666666, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6075949367088608, |
|
"eval_ORGANIZATION_recall": 0.7384615384615385, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8484848484848485, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.696969696969697, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6216216216216216, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.1331242024898529, |
|
"eval_overall_accuracy": 0.9581589958158996, |
|
"eval_overall_f1": 0.8042328042328044, |
|
"eval_overall_precision": 0.7506172839506173, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.9613, |
|
"eval_samples_per_second": 194.534, |
|
"eval_steps_per_second": 3.121, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 11.59224796295166, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.104, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6845637583892618, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6071428571428571, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8917197452229298, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8536585365853658, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.13441863656044006, |
|
"eval_overall_accuracy": 0.9579128722618755, |
|
"eval_overall_f1": 0.8052631578947369, |
|
"eval_overall_precision": 0.7481662591687042, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.9557, |
|
"eval_samples_per_second": 195.663, |
|
"eval_steps_per_second": 3.139, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 0.8353492617607117, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.1025, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.802547770700637, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6666666666666667, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5882352941176471, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.13503114879131317, |
|
"eval_overall_accuracy": 0.956928378045779, |
|
"eval_overall_f1": 0.8010540184453229, |
|
"eval_overall_precision": 0.7450980392156863, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.959, |
|
"eval_samples_per_second": 194.987, |
|
"eval_steps_per_second": 3.128, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 1.756870150566101, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.1032, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.802547770700637, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6758620689655173, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6125, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8484848484848485, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.6567164179104478, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5789473684210527, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.13715174794197083, |
|
"eval_overall_accuracy": 0.956928378045779, |
|
"eval_overall_f1": 0.8010540184453229, |
|
"eval_overall_precision": 0.7450980392156863, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.9565, |
|
"eval_samples_per_second": 195.497, |
|
"eval_steps_per_second": 3.136, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 1.03740656375885, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.0993, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.7924528301886793, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7325581395348837, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6442953020134228, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5714285714285714, |
|
"eval_ORGANIZATION_recall": 0.7384615384615385, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.1355990171432495, |
|
"eval_overall_accuracy": 0.9556977602756583, |
|
"eval_overall_f1": 0.7900262467191601, |
|
"eval_overall_precision": 0.732360097323601, |
|
"eval_overall_recall": 0.8575498575498576, |
|
"eval_runtime": 0.9593, |
|
"eval_samples_per_second": 194.924, |
|
"eval_steps_per_second": 3.127, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 1.2626599073410034, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0992, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6906474820143885, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6486486486486487, |
|
"eval_ORGANIZATION_recall": 0.7384615384615385, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8484848484848485, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.6567164179104478, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5789473684210527, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.13695622980594635, |
|
"eval_overall_accuracy": 0.9576667487078513, |
|
"eval_overall_f1": 0.803713527851459, |
|
"eval_overall_precision": 0.7518610421836228, |
|
"eval_overall_recall": 0.8632478632478633, |
|
"eval_runtime": 0.9565, |
|
"eval_samples_per_second": 195.512, |
|
"eval_steps_per_second": 3.137, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 1.9839859008789062, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.0994, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.7875, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6753246753246754, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5842696629213483, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.888178913738019, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.852760736196319, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14013363420963287, |
|
"eval_overall_accuracy": 0.9571745015998031, |
|
"eval_overall_f1": 0.796875, |
|
"eval_overall_precision": 0.7338129496402878, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.9547, |
|
"eval_samples_per_second": 195.863, |
|
"eval_steps_per_second": 3.142, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 1.7605901956558228, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.0993, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.802547770700637, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6666666666666667, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5795454545454546, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.888178913738019, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.852760736196319, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.696969696969697, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6216216216216216, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.1363925337791443, |
|
"eval_overall_accuracy": 0.9566822544917548, |
|
"eval_overall_f1": 0.8010471204188482, |
|
"eval_overall_precision": 0.7409200968523002, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.9561, |
|
"eval_samples_per_second": 195.585, |
|
"eval_steps_per_second": 3.138, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 1.1708297729492188, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0971, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.8101265822784809, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7529411764705882, |
|
"eval_LOCATION_recall": 0.8767123287671232, |
|
"eval_ORGANIZATION_f1": 0.6322580645161291, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5444444444444444, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.888178913738019, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.852760736196319, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.14004166424274445, |
|
"eval_overall_accuracy": 0.9561900073837066, |
|
"eval_overall_f1": 0.7926988265971318, |
|
"eval_overall_precision": 0.7307692307692307, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.958, |
|
"eval_samples_per_second": 195.201, |
|
"eval_steps_per_second": 3.132, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 2.4600577354431152, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.1, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.802547770700637, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6490066225165563, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5697674418604651, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8157894736842106, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7380952380952381, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1348854899406433, |
|
"eval_overall_accuracy": 0.9566822544917548, |
|
"eval_overall_f1": 0.7968545216251638, |
|
"eval_overall_precision": 0.7378640776699029, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.9627, |
|
"eval_samples_per_second": 194.255, |
|
"eval_steps_per_second": 3.116, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 1.6444453001022339, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.0987, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.7924528301886793, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7325581395348837, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6712328767123288, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6049382716049383, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.1363009363412857, |
|
"eval_overall_accuracy": 0.9561900073837066, |
|
"eval_overall_f1": 0.7984189723320159, |
|
"eval_overall_precision": 0.7426470588235294, |
|
"eval_overall_recall": 0.8632478632478633, |
|
"eval_runtime": 0.9591, |
|
"eval_samples_per_second": 194.968, |
|
"eval_steps_per_second": 3.128, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 0.6375830173492432, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.0976, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6714285714285715, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6266666666666667, |
|
"eval_ORGANIZATION_recall": 0.7230769230769231, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1327548623085022, |
|
"eval_overall_accuracy": 0.9584051193699237, |
|
"eval_overall_f1": 0.8074866310160427, |
|
"eval_overall_precision": 0.760705289672544, |
|
"eval_overall_recall": 0.8603988603988604, |
|
"eval_runtime": 0.9623, |
|
"eval_samples_per_second": 194.331, |
|
"eval_steps_per_second": 3.118, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 2.3580222129821777, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.0957, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6666666666666667, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.618421052631579, |
|
"eval_ORGANIZATION_recall": 0.7230769230769231, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6461538461538462, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5833333333333334, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.132992684841156, |
|
"eval_overall_accuracy": 0.9576667487078513, |
|
"eval_overall_f1": 0.8, |
|
"eval_overall_precision": 0.7518796992481203, |
|
"eval_overall_recall": 0.8547008547008547, |
|
"eval_runtime": 0.9558, |
|
"eval_samples_per_second": 195.648, |
|
"eval_steps_per_second": 3.139, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 1.589872121810913, |
|
"learning_rate": 2e-05, |
|
"loss": 0.0953, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.8129032258064516, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7682926829268293, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6799999999999999, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.888178913738019, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.852760736196319, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13459840416908264, |
|
"eval_overall_accuracy": 0.9581589958158996, |
|
"eval_overall_f1": 0.8073878627968336, |
|
"eval_overall_precision": 0.7518427518427518, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.9605, |
|
"eval_samples_per_second": 194.682, |
|
"eval_steps_per_second": 3.123, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 1.7457832098007202, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.0961, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7042253521126761, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6493506493506493, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.1298547387123108, |
|
"eval_overall_accuracy": 0.9591434900319961, |
|
"eval_overall_f1": 0.8170894526034712, |
|
"eval_overall_precision": 0.7688442211055276, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.9648, |
|
"eval_samples_per_second": 193.828, |
|
"eval_steps_per_second": 3.11, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 1.4289331436157227, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.0951, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.779874213836478, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7209302325581395, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7083333333333334, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6455696202531646, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6567164179104478, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5789473684210527, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7317073170731707, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.13753055036067963, |
|
"eval_overall_accuracy": 0.9566822544917548, |
|
"eval_overall_f1": 0.7994722955145119, |
|
"eval_overall_precision": 0.7444717444717445, |
|
"eval_overall_recall": 0.8632478632478633, |
|
"eval_runtime": 0.9627, |
|
"eval_samples_per_second": 194.239, |
|
"eval_steps_per_second": 3.116, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 5.174590587615967, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0935, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6938775510204082, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6219512195121951, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.1345466524362564, |
|
"eval_overall_accuracy": 0.9566822544917548, |
|
"eval_overall_f1": 0.8089591567852439, |
|
"eval_overall_precision": 0.7524509803921569, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.9663, |
|
"eval_samples_per_second": 193.531, |
|
"eval_steps_per_second": 3.105, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 1.1309547424316406, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0932, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6857142857142857, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.64, |
|
"eval_ORGANIZATION_recall": 0.7384615384615385, |
|
"eval_PERSON_f1": 0.888178913738019, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.852760736196319, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6461538461538462, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5833333333333334, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13020634651184082, |
|
"eval_overall_accuracy": 0.9584051193699237, |
|
"eval_overall_f1": 0.8096514745308312, |
|
"eval_overall_precision": 0.7645569620253164, |
|
"eval_overall_recall": 0.8603988603988604, |
|
"eval_runtime": 0.9602, |
|
"eval_samples_per_second": 194.76, |
|
"eval_steps_per_second": 3.124, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 1.1441256999969482, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0941, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7042253521126761, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6493506493506493, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.696969696969697, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6216216216216216, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.1337554007768631, |
|
"eval_overall_accuracy": 0.9571745015998031, |
|
"eval_overall_f1": 0.8127490039840637, |
|
"eval_overall_precision": 0.7611940298507462, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.9524, |
|
"eval_samples_per_second": 196.337, |
|
"eval_steps_per_second": 3.15, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 1.6348956823349, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.0909, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.697986577181208, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6190476190476191, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.888178913738019, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.852760736196319, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6865671641791046, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6052631578947368, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8266666666666665, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7560975609756098, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1356654316186905, |
|
"eval_overall_accuracy": 0.956928378045779, |
|
"eval_overall_f1": 0.8068331143232589, |
|
"eval_overall_precision": 0.748780487804878, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.9599, |
|
"eval_samples_per_second": 194.806, |
|
"eval_steps_per_second": 3.125, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 1.053985595703125, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0912, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7123287671232877, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6419753086419753, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.696969696969697, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6216216216216216, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13525572419166565, |
|
"eval_overall_accuracy": 0.9566822544917548, |
|
"eval_overall_f1": 0.8153034300791556, |
|
"eval_overall_precision": 0.7592137592137592, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.97, |
|
"eval_samples_per_second": 192.79, |
|
"eval_steps_per_second": 3.093, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 1.5947766304016113, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.0903, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.7770700636942677, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7234042553191491, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6710526315789473, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8421052631578947, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7619047619047619, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13356442749500275, |
|
"eval_overall_accuracy": 0.9576667487078513, |
|
"eval_overall_f1": 0.8133333333333332, |
|
"eval_overall_precision": 0.7644110275689223, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.9656, |
|
"eval_samples_per_second": 193.666, |
|
"eval_steps_per_second": 3.107, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 1.0522669553756714, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.0912, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.8129032258064516, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7682926829268293, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6933333333333334, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.611764705882353, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8648648648648648, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13284043967723846, |
|
"eval_overall_accuracy": 0.9579128722618755, |
|
"eval_overall_f1": 0.8174603174603174, |
|
"eval_overall_precision": 0.762962962962963, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.9644, |
|
"eval_samples_per_second": 193.907, |
|
"eval_steps_per_second": 3.111, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 0.6589028835296631, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.0902, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.7999999999999999, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.6950354609929077, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6447368421052632, |
|
"eval_ORGANIZATION_recall": 0.7538461538461538, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8648648648648648, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13150876760482788, |
|
"eval_overall_accuracy": 0.9581589958158996, |
|
"eval_overall_f1": 0.8165997322623829, |
|
"eval_overall_precision": 0.7702020202020202, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.9609, |
|
"eval_samples_per_second": 194.607, |
|
"eval_steps_per_second": 3.122, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 1.6209025382995605, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0908, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.779874213836478, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7209302325581395, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7074829931972789, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6341463414634146, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8157894736842106, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7380952380952381, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13572926819324493, |
|
"eval_overall_accuracy": 0.9566822544917548, |
|
"eval_overall_f1": 0.8063241106719368, |
|
"eval_overall_precision": 0.75, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.9565, |
|
"eval_samples_per_second": 195.501, |
|
"eval_steps_per_second": 3.136, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 1.03559410572052, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0897, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7042253521126761, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6493506493506493, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6461538461538462, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5833333333333334, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.8533333333333334, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7804878048780488, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13340426981449127, |
|
"eval_overall_accuracy": 0.9574206251538272, |
|
"eval_overall_f1": 0.8106666666666666, |
|
"eval_overall_precision": 0.7619047619047619, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.9726, |
|
"eval_samples_per_second": 192.276, |
|
"eval_steps_per_second": 3.085, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 0.4955795407295227, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0896, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7034482758620688, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6375, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8648648648648648, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.1333453506231308, |
|
"eval_overall_accuracy": 0.9581589958158996, |
|
"eval_overall_f1": 0.8143236074270558, |
|
"eval_overall_precision": 0.7617866004962779, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.9636, |
|
"eval_samples_per_second": 194.067, |
|
"eval_steps_per_second": 3.113, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 1.707966685295105, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0882, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.6906474820143885, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6486486486486487, |
|
"eval_ORGANIZATION_recall": 0.7384615384615385, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8648648648648648, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.1297333836555481, |
|
"eval_overall_accuracy": 0.9586512429239479, |
|
"eval_overall_f1": 0.8150134048257373, |
|
"eval_overall_precision": 0.769620253164557, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.9528, |
|
"eval_samples_per_second": 196.262, |
|
"eval_steps_per_second": 3.149, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 0.7755259275436401, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0895, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7183098591549296, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6623376623376623, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8648648648648648, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13311755657196045, |
|
"eval_overall_accuracy": 0.9591434900319961, |
|
"eval_overall_f1": 0.8186666666666667, |
|
"eval_overall_precision": 0.7694235588972431, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.9564, |
|
"eval_samples_per_second": 195.535, |
|
"eval_steps_per_second": 3.137, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 4.219042778015137, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0888, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.7922077922077922, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7083333333333334, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6455696202531646, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6461538461538462, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5833333333333334, |
|
"eval_QUANTITY_recall": 0.7241379310344828, |
|
"eval_TIME_f1": 0.8648648648648648, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.1329285353422165, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.8128342245989305, |
|
"eval_overall_precision": 0.7657430730478589, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.9598, |
|
"eval_samples_per_second": 194.825, |
|
"eval_steps_per_second": 3.126, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 2.975076675415039, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.0879, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7042253521126761, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6493506493506493, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8648648648648648, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13204999268054962, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.8155080213903743, |
|
"eval_overall_precision": 0.7682619647355163, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 1.0462, |
|
"eval_samples_per_second": 178.743, |
|
"eval_steps_per_second": 2.868, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 1.8520476818084717, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.0869, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7042253521126761, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6493506493506493, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13332289457321167, |
|
"eval_overall_accuracy": 0.9584051193699237, |
|
"eval_overall_f1": 0.8117489986648865, |
|
"eval_overall_precision": 0.7638190954773869, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.958, |
|
"eval_samples_per_second": 195.208, |
|
"eval_steps_per_second": 3.132, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 1.4421206712722778, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0901, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.7974683544303799, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.863013698630137, |
|
"eval_ORGANIZATION_f1": 0.7297297297297298, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6506024096385542, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8157894736842106, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7380952380952381, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1383257359266281, |
|
"eval_overall_accuracy": 0.9574206251538272, |
|
"eval_overall_f1": 0.8131578947368421, |
|
"eval_overall_precision": 0.7555012224938875, |
|
"eval_overall_recall": 0.8803418803418803, |
|
"eval_runtime": 0.9652, |
|
"eval_samples_per_second": 193.746, |
|
"eval_steps_per_second": 3.108, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 1.3702669143676758, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0871, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7323943661971831, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6753246753246753, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13473859429359436, |
|
"eval_overall_accuracy": 0.9584051193699237, |
|
"eval_overall_f1": 0.8160000000000001, |
|
"eval_overall_precision": 0.7669172932330827, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.9538, |
|
"eval_samples_per_second": 196.051, |
|
"eval_steps_per_second": 3.145, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 2.0529441833496094, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0851, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7323943661971831, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6753246753246753, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8648648648648648, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13238033652305603, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.8197596795727637, |
|
"eval_overall_precision": 0.7713567839195979, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.9602, |
|
"eval_samples_per_second": 194.754, |
|
"eval_steps_per_second": 3.124, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 2.319127321243286, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0861, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7323943661971831, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6753246753246753, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8648648648648648, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13330510258674622, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.8197596795727637, |
|
"eval_overall_precision": 0.7713567839195979, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 1.0386, |
|
"eval_samples_per_second": 180.057, |
|
"eval_steps_per_second": 2.889, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 1.1554148197174072, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.0877, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7412587412587412, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6794871794871795, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8493150684931507, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.7948717948717948, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1339869350194931, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.8197596795727637, |
|
"eval_overall_precision": 0.7713567839195979, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.9521, |
|
"eval_samples_per_second": 196.415, |
|
"eval_steps_per_second": 3.151, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 1.0138518810272217, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0873, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7272727272727272, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8648648648648648, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13319392502307892, |
|
"eval_overall_accuracy": 0.9591434900319961, |
|
"eval_overall_f1": 0.8197596795727637, |
|
"eval_overall_precision": 0.7713567839195979, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.9541, |
|
"eval_samples_per_second": 196.006, |
|
"eval_steps_per_second": 3.144, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 1.4809114933013916, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0878, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.7848101265822783, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7412587412587412, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6794871794871795, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.5945945945945946, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8108108108108107, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8823529411764706, |
|
"eval_loss": 0.13555191457271576, |
|
"eval_overall_accuracy": 0.9581589958158996, |
|
"eval_overall_f1": 0.8138297872340426, |
|
"eval_overall_precision": 0.7630922693266833, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.9587, |
|
"eval_samples_per_second": 195.046, |
|
"eval_steps_per_second": 3.129, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 0.6918728947639465, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0854, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.7870967741935484, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7183098591549296, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6623376623376623, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7076923076923076, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6388888888888888, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8648648648648648, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13175515830516815, |
|
"eval_overall_accuracy": 0.9591434900319961, |
|
"eval_overall_f1": 0.8192771084337349, |
|
"eval_overall_precision": 0.7727272727272727, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.9509, |
|
"eval_samples_per_second": 196.659, |
|
"eval_steps_per_second": 3.155, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 1.3241691589355469, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0848, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7183098591549296, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6623376623376623, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.696969696969697, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6216216216216216, |
|
"eval_QUANTITY_recall": 0.7931034482758621, |
|
"eval_TIME_f1": 0.8648648648648648, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.9411764705882353, |
|
"eval_loss": 0.13328462839126587, |
|
"eval_overall_accuracy": 0.9586512429239479, |
|
"eval_overall_f1": 0.8186666666666667, |
|
"eval_overall_precision": 0.7694235588972431, |
|
"eval_overall_recall": 0.8746438746438746, |
|
"eval_runtime": 0.9604, |
|
"eval_samples_per_second": 194.71, |
|
"eval_steps_per_second": 3.124, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 1.2514363527297974, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0841, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7183098591549296, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6623376623376623, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1320430040359497, |
|
"eval_overall_accuracy": 0.9584051193699237, |
|
"eval_overall_f1": 0.814419225634179, |
|
"eval_overall_precision": 0.7663316582914573, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.9664, |
|
"eval_samples_per_second": 193.506, |
|
"eval_steps_per_second": 3.104, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 1.3548272848129272, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0868, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7183098591549296, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6623376623376623, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13209053874015808, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.814419225634179, |
|
"eval_overall_precision": 0.7663316582914573, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.9587, |
|
"eval_samples_per_second": 195.062, |
|
"eval_steps_per_second": 3.129, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 2.0916614532470703, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0844, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7183098591549296, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6623376623376623, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13177448511123657, |
|
"eval_overall_accuracy": 0.9586512429239479, |
|
"eval_overall_f1": 0.8128342245989305, |
|
"eval_overall_precision": 0.7657430730478589, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 1.0153, |
|
"eval_samples_per_second": 184.182, |
|
"eval_steps_per_second": 2.955, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 2.0040924549102783, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0838, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7272727272727272, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13262386620044708, |
|
"eval_overall_accuracy": 0.9591434900319961, |
|
"eval_overall_f1": 0.8160000000000001, |
|
"eval_overall_precision": 0.7669172932330827, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.9604, |
|
"eval_samples_per_second": 194.708, |
|
"eval_steps_per_second": 3.124, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 1.6822946071624756, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.0866, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.7898089171974523, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8493150684931506, |
|
"eval_ORGANIZATION_f1": 0.7272727272727272, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.133206307888031, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.8160000000000001, |
|
"eval_overall_precision": 0.7669172932330827, |
|
"eval_overall_recall": 0.8717948717948718, |
|
"eval_runtime": 0.9555, |
|
"eval_samples_per_second": 195.706, |
|
"eval_steps_per_second": 3.14, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 0.4100649654865265, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.085, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.7870967741935484, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7183098591549296, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6623376623376623, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1316729038953781, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.8139223560910307, |
|
"eval_overall_precision": 0.7676767676767676, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.9566, |
|
"eval_samples_per_second": 195.484, |
|
"eval_steps_per_second": 3.136, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 4.882697582244873, |
|
"learning_rate": 3e-06, |
|
"loss": 0.084, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7272727272727272, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1321730613708496, |
|
"eval_overall_accuracy": 0.958897366477972, |
|
"eval_overall_f1": 0.814419225634179, |
|
"eval_overall_precision": 0.7663316582914573, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.9581, |
|
"eval_samples_per_second": 195.183, |
|
"eval_steps_per_second": 3.131, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 1.8372896909713745, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0838, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7272727272727272, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13190868496894836, |
|
"eval_overall_accuracy": 0.9586512429239479, |
|
"eval_overall_f1": 0.814419225634179, |
|
"eval_overall_precision": 0.7663316582914573, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 0.9655, |
|
"eval_samples_per_second": 193.678, |
|
"eval_steps_per_second": 3.107, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 1.2674877643585205, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.087, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7272727272727272, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13277865946292877, |
|
"eval_overall_accuracy": 0.9584051193699237, |
|
"eval_overall_f1": 0.814419225634179, |
|
"eval_overall_precision": 0.7663316582914573, |
|
"eval_overall_recall": 0.8689458689458689, |
|
"eval_runtime": 1.1022, |
|
"eval_samples_per_second": 169.654, |
|
"eval_steps_per_second": 2.722, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 0.8085970878601074, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.0832, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.7870967741935484, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7183098591549296, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6623376623376623, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.131379634141922, |
|
"eval_overall_accuracy": 0.9586512429239479, |
|
"eval_overall_f1": 0.8139223560910307, |
|
"eval_overall_precision": 0.7676767676767676, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.9613, |
|
"eval_samples_per_second": 194.531, |
|
"eval_steps_per_second": 3.121, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 1.0001689195632935, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0859, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.7870967741935484, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7183098591549296, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6623376623376623, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13154591619968414, |
|
"eval_overall_accuracy": 0.9586512429239479, |
|
"eval_overall_f1": 0.8139223560910307, |
|
"eval_overall_precision": 0.7676767676767676, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.9546, |
|
"eval_samples_per_second": 195.886, |
|
"eval_steps_per_second": 3.143, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 0.9420944452285767, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.0838, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7183098591549296, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6623376623376623, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.13177190721035004, |
|
"eval_overall_accuracy": 0.9586512429239479, |
|
"eval_overall_f1": 0.8128342245989305, |
|
"eval_overall_precision": 0.7657430730478589, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.9644, |
|
"eval_samples_per_second": 193.898, |
|
"eval_steps_per_second": 3.111, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 0.9724701046943665, |
|
"learning_rate": 0.0, |
|
"loss": 0.0849, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.7820512820512822, |
|
"eval_LOCATION_number": 73, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8356164383561644, |
|
"eval_ORGANIZATION_f1": 0.7183098591549296, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6623376623376623, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.676923076923077, |
|
"eval_QUANTITY_number": 29, |
|
"eval_QUANTITY_precision": 0.6111111111111112, |
|
"eval_QUANTITY_recall": 0.7586206896551724, |
|
"eval_TIME_f1": 0.8378378378378379, |
|
"eval_TIME_number": 34, |
|
"eval_TIME_precision": 0.775, |
|
"eval_TIME_recall": 0.9117647058823529, |
|
"eval_loss": 0.1317785680294037, |
|
"eval_overall_accuracy": 0.9586512429239479, |
|
"eval_overall_f1": 0.8128342245989305, |
|
"eval_overall_precision": 0.7657430730478589, |
|
"eval_overall_recall": 0.8660968660968661, |
|
"eval_runtime": 0.9669, |
|
"eval_samples_per_second": 193.4, |
|
"eval_steps_per_second": 3.103, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 10600, |
|
"total_flos": 4535917761443712.0, |
|
"train_loss": 0.1449212483639987, |
|
"train_runtime": 1228.7031, |
|
"train_samples_per_second": 137.381, |
|
"train_steps_per_second": 8.627 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 10600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 4535917761443712.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|