|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 10600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 2.5185272693634033, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 0.9922, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.012048192771084338, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.0625, |
|
"eval_PERSON_recall": 0.006666666666666667, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.5609568953514099, |
|
"eval_overall_accuracy": 0.8435984481086324, |
|
"eval_overall_f1": 0.005347593582887699, |
|
"eval_overall_precision": 0.037037037037037035, |
|
"eval_overall_recall": 0.002881844380403458, |
|
"eval_runtime": 0.3848, |
|
"eval_samples_per_second": 485.953, |
|
"eval_steps_per_second": 7.796, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 1.2335773706436157, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.4811, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.416, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.48148148148148145, |
|
"eval_LOCATION_recall": 0.36619718309859156, |
|
"eval_ORGANIZATION_f1": 0.14285714285714285, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.14754098360655737, |
|
"eval_ORGANIZATION_recall": 0.13846153846153847, |
|
"eval_PERSON_f1": 0.6887052341597797, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.5868544600938967, |
|
"eval_PERSON_recall": 0.8333333333333334, |
|
"eval_QUANTITY_f1": 0.3692307692307692, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.375, |
|
"eval_QUANTITY_recall": 0.36363636363636365, |
|
"eval_TIME_f1": 0.7586206896551724, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7333333333333333, |
|
"eval_TIME_recall": 0.7857142857142857, |
|
"eval_loss": 0.32625189423561096, |
|
"eval_overall_accuracy": 0.9093113482056256, |
|
"eval_overall_f1": 0.5264586160108549, |
|
"eval_overall_precision": 0.49743589743589745, |
|
"eval_overall_recall": 0.5590778097982709, |
|
"eval_runtime": 0.3833, |
|
"eval_samples_per_second": 487.897, |
|
"eval_steps_per_second": 7.827, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 0.693739652633667, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.2923, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.6103896103896105, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.5662650602409639, |
|
"eval_LOCATION_recall": 0.6619718309859155, |
|
"eval_ORGANIZATION_f1": 0.47619047619047616, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.4268292682926829, |
|
"eval_ORGANIZATION_recall": 0.5384615384615384, |
|
"eval_PERSON_f1": 0.8348909657320873, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.783625730994152, |
|
"eval_PERSON_recall": 0.8933333333333333, |
|
"eval_QUANTITY_f1": 0.6133333333333334, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5476190476190477, |
|
"eval_QUANTITY_recall": 0.696969696969697, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.19018957018852234, |
|
"eval_overall_accuracy": 0.9338021338506305, |
|
"eval_overall_f1": 0.6948480845442536, |
|
"eval_overall_precision": 0.6414634146341464, |
|
"eval_overall_recall": 0.7579250720461095, |
|
"eval_runtime": 0.3878, |
|
"eval_samples_per_second": 482.181, |
|
"eval_steps_per_second": 7.736, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 1.1100132465362549, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.2082, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.7388535031847132, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6744186046511628, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.638036809815951, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5306122448979592, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8589341692789968, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8106508875739645, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7012987012987013, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15403173863887787, |
|
"eval_overall_accuracy": 0.9459262851600388, |
|
"eval_overall_f1": 0.7700258397932818, |
|
"eval_overall_precision": 0.6978922716627635, |
|
"eval_overall_recall": 0.8587896253602305, |
|
"eval_runtime": 0.3873, |
|
"eval_samples_per_second": 482.781, |
|
"eval_steps_per_second": 7.745, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 1.3037128448486328, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.1772, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.7612903225806451, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7023809523809523, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.6756756756756758, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6024096385542169, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8698412698412699, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8303030303030303, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6835443037974683, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5869565217391305, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8524590163934426, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7878787878787878, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.14435262978076935, |
|
"eval_overall_accuracy": 0.9512609117361784, |
|
"eval_overall_f1": 0.7889182058047493, |
|
"eval_overall_precision": 0.7274939172749392, |
|
"eval_overall_recall": 0.861671469740634, |
|
"eval_runtime": 0.3878, |
|
"eval_samples_per_second": 482.157, |
|
"eval_steps_per_second": 7.735, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 0.9674538969993591, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.1576, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.7151515151515151, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6276595744680851, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.674698795180723, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5544554455445545, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.866043613707165, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8128654970760234, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6363636363636364, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.509090909090909, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.78125, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6944444444444444, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1679927557706833, |
|
"eval_overall_accuracy": 0.9413191076624636, |
|
"eval_overall_f1": 0.763681592039801, |
|
"eval_overall_precision": 0.6717724288840262, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3864, |
|
"eval_samples_per_second": 483.937, |
|
"eval_steps_per_second": 7.764, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 1.824372410774231, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.147, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.7741935483870968, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7142857142857143, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7124999999999999, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8606811145510835, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8034682080924855, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7012987012987013, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.806451612903226, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7352941176470589, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1446426808834076, |
|
"eval_overall_accuracy": 0.9519883608147429, |
|
"eval_overall_f1": 0.7927927927927928, |
|
"eval_overall_precision": 0.7162790697674418, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.4021, |
|
"eval_samples_per_second": 465.047, |
|
"eval_steps_per_second": 7.461, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 0.6194243431091309, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.1329, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.7453416149068322, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6666666666666666, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.6993865030674845, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5816326530612245, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8643533123028392, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8203592814371258, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.14050208032131195, |
|
"eval_overall_accuracy": 0.9517458777885548, |
|
"eval_overall_f1": 0.7948387096774193, |
|
"eval_overall_precision": 0.719626168224299, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3833, |
|
"eval_samples_per_second": 487.894, |
|
"eval_steps_per_second": 7.827, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 0.7105451226234436, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.1309, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.7814569536423841, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7375, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.6628571428571428, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5272727272727272, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.6419753086419753, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5416666666666666, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.7936507936507937, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13999436795711517, |
|
"eval_overall_accuracy": 0.9471387002909797, |
|
"eval_overall_f1": 0.7774936061381075, |
|
"eval_overall_precision": 0.6988505747126437, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3878, |
|
"eval_samples_per_second": 482.216, |
|
"eval_steps_per_second": 7.736, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 1.1783398389816284, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.1247, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.778523489932886, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7435897435897436, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8653846153846153, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8333333333333334, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.6666666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5777777777777777, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1291128396987915, |
|
"eval_overall_accuracy": 0.953443258971872, |
|
"eval_overall_f1": 0.7989276139410187, |
|
"eval_overall_precision": 0.7468671679197995, |
|
"eval_overall_recall": 0.8587896253602305, |
|
"eval_runtime": 0.3867, |
|
"eval_samples_per_second": 483.627, |
|
"eval_steps_per_second": 7.759, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 0.8099766969680786, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.1149, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.7763157894736843, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7283950617283951, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.708860759493671, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6021505376344086, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.870967741935484, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.84375, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.7012987012987013, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.7384615384615384, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6486486486486487, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1423446536064148, |
|
"eval_overall_accuracy": 0.9493210475266731, |
|
"eval_overall_f1": 0.7900262467191601, |
|
"eval_overall_precision": 0.7253012048192771, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.3857, |
|
"eval_samples_per_second": 484.776, |
|
"eval_steps_per_second": 7.777, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 0.6322067975997925, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.1118, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.7239263803680982, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6413043478260869, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7124999999999999, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8125000000000001, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7222222222222222, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.15240532159805298, |
|
"eval_overall_accuracy": 0.9493210475266731, |
|
"eval_overall_f1": 0.7902187902187902, |
|
"eval_overall_precision": 0.713953488372093, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3901, |
|
"eval_samples_per_second": 479.371, |
|
"eval_steps_per_second": 7.69, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 0.8599780797958374, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.1051, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.759493670886076, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7307692307692307, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6263736263736264, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7297297297297297, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.9090909090909091, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9259259259259259, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1298385113477707, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.8165997322623828, |
|
"eval_overall_precision": 0.7625, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3867, |
|
"eval_samples_per_second": 483.589, |
|
"eval_steps_per_second": 7.758, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 1.4172143936157227, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.1071, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.858974358974359, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8271604938271605, |
|
"eval_PERSON_recall": 0.8933333333333333, |
|
"eval_QUANTITY_f1": 0.7012987012987013, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13883614540100098, |
|
"eval_overall_accuracy": 0.9524733268671193, |
|
"eval_overall_f1": 0.7984084880636606, |
|
"eval_overall_precision": 0.7395577395577395, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.3854, |
|
"eval_samples_per_second": 485.176, |
|
"eval_steps_per_second": 7.784, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 1.1519190073013306, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.1001, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7261146496815286, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6195652173913043, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14001114666461945, |
|
"eval_overall_accuracy": 0.9556256062075654, |
|
"eval_overall_f1": 0.8153034300791556, |
|
"eval_overall_precision": 0.7518248175182481, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3855, |
|
"eval_samples_per_second": 485.068, |
|
"eval_steps_per_second": 7.782, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 1.1742072105407715, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.0955, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.8025477707006369, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7325581395348837, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7080745341614907, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.59375, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6753246753246752, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5909090909090909, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14204736053943634, |
|
"eval_overall_accuracy": 0.9541707080504365, |
|
"eval_overall_f1": 0.806282722513089, |
|
"eval_overall_precision": 0.7386091127098321, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3883, |
|
"eval_samples_per_second": 481.631, |
|
"eval_steps_per_second": 7.727, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 1.7436004877090454, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.0905, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.7919463087248323, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7564102564102564, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7417218543046358, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6511627906976745, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8745980707395499, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.84472049689441, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.7936507936507937, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1411171555519104, |
|
"eval_overall_accuracy": 0.9565955383123181, |
|
"eval_overall_f1": 0.808, |
|
"eval_overall_precision": 0.7518610421836228, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.3859, |
|
"eval_samples_per_second": 484.578, |
|
"eval_steps_per_second": 7.774, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 0.690143346786499, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.0882, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.759493670886076, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7006369426751592, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5978260869565217, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6315789473684211, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5581395348837209, |
|
"eval_QUANTITY_recall": 0.7272727272727273, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14777430891990662, |
|
"eval_overall_accuracy": 0.9536857419980601, |
|
"eval_overall_f1": 0.8031914893617021, |
|
"eval_overall_precision": 0.745679012345679, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.3876, |
|
"eval_samples_per_second": 482.459, |
|
"eval_steps_per_second": 7.74, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 0.7800413370132446, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.0867, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.7755102040816326, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.7272727272727272, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8774193548387097, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7027027027027027, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6341463414634146, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1365654617547989, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8049113233287859, |
|
"eval_overall_precision": 0.7642487046632125, |
|
"eval_overall_recall": 0.8501440922190202, |
|
"eval_runtime": 0.3898, |
|
"eval_samples_per_second": 479.734, |
|
"eval_steps_per_second": 7.696, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 1.5175530910491943, |
|
"learning_rate": 4e-05, |
|
"loss": 0.083, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.8053691275167785, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7692307692307693, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7096774193548387, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6111111111111112, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8766233766233766, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8544303797468354, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.732394366197183, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6842105263157895, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14018449187278748, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8135135135135135, |
|
"eval_overall_precision": 0.7659033078880407, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.3866, |
|
"eval_samples_per_second": 483.701, |
|
"eval_steps_per_second": 7.76, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 0.6179842352867126, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.0818, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.6993865030674845, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5816326530612245, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9049180327868852, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8903225806451613, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6419753086419753, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5416666666666666, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.15062209963798523, |
|
"eval_overall_accuracy": 0.9524733268671193, |
|
"eval_overall_f1": 0.8078947368421052, |
|
"eval_overall_precision": 0.7433414043583535, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3883, |
|
"eval_samples_per_second": 481.579, |
|
"eval_steps_per_second": 7.726, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 0.7422575354576111, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.0824, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.8129032258064516, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7006369426751592, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5978260869565217, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8580441640378549, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8143712574850299, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14866971969604492, |
|
"eval_overall_accuracy": 0.9546556741028128, |
|
"eval_overall_f1": 0.8010471204188482, |
|
"eval_overall_precision": 0.7338129496402878, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3904, |
|
"eval_samples_per_second": 478.947, |
|
"eval_steps_per_second": 7.684, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 0.7634256482124329, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.076, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.8053691275167785, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7692307692307693, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7225806451612903, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6222222222222222, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8823529411764707, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8653846153846154, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.888888888888889, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9230769230769231, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13874635100364685, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8206521739130433, |
|
"eval_overall_precision": 0.7763496143958869, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.3855, |
|
"eval_samples_per_second": 485.092, |
|
"eval_steps_per_second": 7.782, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 0.7481046915054321, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.0745, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.8129032258064516, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7215189873417722, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6129032258064516, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7027027027027027, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6341463414634146, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.14388589560985565, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.821664464993395, |
|
"eval_overall_precision": 0.7585365853658537, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.387, |
|
"eval_samples_per_second": 483.235, |
|
"eval_steps_per_second": 7.752, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 0.7572817206382751, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.0731, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7169811320754718, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6063829787234043, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.90032154340836, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1537763774394989, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8222811671087533, |
|
"eval_overall_precision": 0.7616707616707616, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3899, |
|
"eval_samples_per_second": 479.593, |
|
"eval_steps_per_second": 7.694, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 0.5087524652481079, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.0713, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7482993197278912, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6707317073170732, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6493506493506495, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5681818181818182, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14748218655586243, |
|
"eval_overall_accuracy": 0.9568380213385063, |
|
"eval_overall_f1": 0.8144192256341789, |
|
"eval_overall_precision": 0.7587064676616916, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3893, |
|
"eval_samples_per_second": 480.312, |
|
"eval_steps_per_second": 7.706, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 1.3006908893585205, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.0712, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.7712418300653594, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7195121951219512, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7421383647798743, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6276595744680851, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.8789808917197452, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8414634146341463, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6666666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5777777777777777, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.9090909090909091, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9259259259259259, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1678486168384552, |
|
"eval_overall_accuracy": 0.9517458777885548, |
|
"eval_overall_f1": 0.8089591567852438, |
|
"eval_overall_precision": 0.7451456310679612, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3855, |
|
"eval_samples_per_second": 485.032, |
|
"eval_steps_per_second": 7.781, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 0.8932152986526489, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.07, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.759493670886076, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7532467532467532, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.651685393258427, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8774193548387097, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.6486486486486487, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5853658536585366, |
|
"eval_QUANTITY_recall": 0.7272727272727273, |
|
"eval_TIME_f1": 0.8928571428571429, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8928571428571429, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.15593300759792328, |
|
"eval_overall_accuracy": 0.9544131910766246, |
|
"eval_overall_f1": 0.814516129032258, |
|
"eval_overall_precision": 0.7632241813602015, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.3874, |
|
"eval_samples_per_second": 482.726, |
|
"eval_steps_per_second": 7.744, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 0.7077963948249817, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.0687, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.802721088435374, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7763157894736842, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.728395061728395, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6082474226804123, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.8737864077669903, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8490566037735849, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.732394366197183, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6842105263157895, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8524590163934426, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7878787878787878, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.14312958717346191, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8133333333333335, |
|
"eval_overall_precision": 0.7568238213399504, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3863, |
|
"eval_samples_per_second": 484.115, |
|
"eval_steps_per_second": 7.767, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 0.8946846723556519, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.0665, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.8053691275167785, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7692307692307693, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7662337662337663, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6629213483146067, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7605633802816901, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7105263157894737, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1464053988456726, |
|
"eval_overall_accuracy": 0.9595053346265762, |
|
"eval_overall_f1": 0.830188679245283, |
|
"eval_overall_precision": 0.779746835443038, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3853, |
|
"eval_samples_per_second": 485.352, |
|
"eval_steps_per_second": 7.786, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.43450927734375, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.0634, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7733333333333334, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6823529411764706, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.888888888888889, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8484848484848485, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7222222222222221, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.15990784764289856, |
|
"eval_overall_accuracy": 0.9568380213385063, |
|
"eval_overall_f1": 0.8320000000000001, |
|
"eval_overall_precision": 0.7741935483870968, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.386, |
|
"eval_samples_per_second": 484.508, |
|
"eval_steps_per_second": 7.773, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 0.4396691620349884, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.0602, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.7741935483870968, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7142857142857143, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7388535031847134, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6304347826086957, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6666666666666667, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5952380952380952, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.17173334956169128, |
|
"eval_overall_accuracy": 0.9529582929194956, |
|
"eval_overall_f1": 0.8115942028985507, |
|
"eval_overall_precision": 0.7475728155339806, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.387, |
|
"eval_samples_per_second": 483.26, |
|
"eval_steps_per_second": 7.753, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 0.7759618163108826, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.0633, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.7866666666666666, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7468354430379747, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.7534246575342466, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6790123456790124, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7222222222222221, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1525535136461258, |
|
"eval_overall_accuracy": 0.9556256062075654, |
|
"eval_overall_f1": 0.8228882833787465, |
|
"eval_overall_precision": 0.7803617571059431, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.386, |
|
"eval_samples_per_second": 484.395, |
|
"eval_steps_per_second": 7.771, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 1.0217112302780151, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.0596, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7261146496815286, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6195652173913043, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7123287671232875, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.65, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8070175438596492, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7931034482758621, |
|
"eval_TIME_recall": 0.8214285714285714, |
|
"eval_loss": 0.15602585673332214, |
|
"eval_overall_accuracy": 0.95635305528613, |
|
"eval_overall_f1": 0.8154050464807437, |
|
"eval_overall_precision": 0.7561576354679803, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.385, |
|
"eval_samples_per_second": 485.685, |
|
"eval_steps_per_second": 7.792, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 0.47391146421432495, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.0591, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7261146496815286, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6195652173913043, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8896103896103896, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8670886075949367, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7222222222222221, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1562255322933197, |
|
"eval_overall_accuracy": 0.9556256062075654, |
|
"eval_overall_f1": 0.8186666666666667, |
|
"eval_overall_precision": 0.7617866004962779, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3871, |
|
"eval_samples_per_second": 483.118, |
|
"eval_steps_per_second": 7.751, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 1.473497748374939, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.0582, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7160493827160493, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5979381443298969, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8932038834951457, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8679245283018868, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.896551724137931, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1698862910270691, |
|
"eval_overall_accuracy": 0.9524733268671193, |
|
"eval_overall_f1": 0.8184210526315788, |
|
"eval_overall_precision": 0.7530266343825666, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3888, |
|
"eval_samples_per_second": 480.937, |
|
"eval_steps_per_second": 7.716, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 0.5742448568344116, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.0567, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.775, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6966292134831461, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7169811320754718, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6063829787234043, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.17796191573143005, |
|
"eval_overall_accuracy": 0.9498060135790495, |
|
"eval_overall_f1": 0.8073394495412844, |
|
"eval_overall_precision": 0.7403846153846154, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3904, |
|
"eval_samples_per_second": 479.01, |
|
"eval_steps_per_second": 7.685, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 0.6908618211746216, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.0568, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.8053691275167785, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7692307692307693, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7482993197278912, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6707317073170732, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6933333333333334, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6190476190476191, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1589268296957016, |
|
"eval_overall_accuracy": 0.9568380213385063, |
|
"eval_overall_f1": 0.8216216216216217, |
|
"eval_overall_precision": 0.7735368956743003, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.387, |
|
"eval_samples_per_second": 483.227, |
|
"eval_steps_per_second": 7.752, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 0.37814459204673767, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.0553, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.759493670886076, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6896551724137931, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7195121951219511, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5959595959595959, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.8853503184713376, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8475609756097561, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.896551724137931, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.17944246530532837, |
|
"eval_overall_accuracy": 0.9500484966052376, |
|
"eval_overall_f1": 0.8120104438642298, |
|
"eval_overall_precision": 0.7422434367541766, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3856, |
|
"eval_samples_per_second": 484.921, |
|
"eval_steps_per_second": 7.779, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 0.3985283672809601, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0522, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.7924528301886792, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7159090909090909, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7516778523489933, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8825396825396825, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8424242424242424, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.732394366197183, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6842105263157895, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.16948159039020538, |
|
"eval_overall_accuracy": 0.9551406401551892, |
|
"eval_overall_f1": 0.8196286472148541, |
|
"eval_overall_precision": 0.7592137592137592, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3866, |
|
"eval_samples_per_second": 483.76, |
|
"eval_steps_per_second": 7.761, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 0.4095101058483124, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.0535, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7417218543046358, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6511627906976745, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8753993610223643, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6842105263157895, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6046511627906976, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.16789713501930237, |
|
"eval_overall_accuracy": 0.9517458777885548, |
|
"eval_overall_f1": 0.8090185676392573, |
|
"eval_overall_precision": 0.7493857493857494, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3862, |
|
"eval_samples_per_second": 484.225, |
|
"eval_steps_per_second": 7.768, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 0.30107811093330383, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.0507, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7248322147651007, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6428571428571429, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8867313915857605, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8616352201257862, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.15727120637893677, |
|
"eval_overall_accuracy": 0.9561105722599418, |
|
"eval_overall_f1": 0.8221024258760108, |
|
"eval_overall_precision": 0.7721518987341772, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3852, |
|
"eval_samples_per_second": 485.428, |
|
"eval_steps_per_second": 7.788, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 0.3901791274547577, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.0501, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6967741935483871, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1803949922323227, |
|
"eval_overall_accuracy": 0.9524733268671193, |
|
"eval_overall_f1": 0.8100263852242744, |
|
"eval_overall_precision": 0.7469586374695864, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3846, |
|
"eval_samples_per_second": 486.267, |
|
"eval_steps_per_second": 7.801, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 0.7794935703277588, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.0491, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.7870967741935485, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.6918238993710691, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5851063829787234, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1680927574634552, |
|
"eval_overall_accuracy": 0.953443258971872, |
|
"eval_overall_f1": 0.8105960264900663, |
|
"eval_overall_precision": 0.75, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.387, |
|
"eval_samples_per_second": 483.206, |
|
"eval_steps_per_second": 7.752, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 1.7887659072875977, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.0478, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7448275862068966, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.675, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.896551724137931, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.16480599343776703, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8297297297297298, |
|
"eval_overall_precision": 0.7811704834605598, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3859, |
|
"eval_samples_per_second": 484.601, |
|
"eval_steps_per_second": 7.774, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 0.7143243551254272, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.0475, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.7898089171974522, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7209302325581395, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.738255033557047, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6547619047619048, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7605633802816901, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7105263157894737, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.15505646169185638, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.824631860776439, |
|
"eval_overall_precision": 0.77, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3863, |
|
"eval_samples_per_second": 484.039, |
|
"eval_steps_per_second": 7.765, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 0.987457811832428, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.0462, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7189542483660131, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.625, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.16851799190044403, |
|
"eval_overall_accuracy": 0.954898157129001, |
|
"eval_overall_f1": 0.8139223560910308, |
|
"eval_overall_precision": 0.76, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3876, |
|
"eval_samples_per_second": 482.46, |
|
"eval_steps_per_second": 7.74, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 0.8889041543006897, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.0467, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.8129032258064516, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7333333333333334, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6470588235294118, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7605633802816901, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7105263157894737, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.896551724137931, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.17139677703380585, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.8306451612903226, |
|
"eval_overall_precision": 0.7783375314861462, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3868, |
|
"eval_samples_per_second": 483.496, |
|
"eval_steps_per_second": 7.757, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 0.43323248624801636, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.0462, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7448275862068966, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.675, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7714285714285715, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7297297297297297, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1640593409538269, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.8288043478260869, |
|
"eval_overall_precision": 0.7840616966580977, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3874, |
|
"eval_samples_per_second": 482.695, |
|
"eval_steps_per_second": 7.744, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 1.8610317707061768, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0467, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7297297297297298, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6506024096385542, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.16927781701087952, |
|
"eval_overall_accuracy": 0.9556256062075654, |
|
"eval_overall_f1": 0.8183041722745625, |
|
"eval_overall_precision": 0.7676767676767676, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3864, |
|
"eval_samples_per_second": 483.901, |
|
"eval_steps_per_second": 7.763, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 0.744925320148468, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.0437, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.7898089171974522, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7209302325581395, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.6896551724137931, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.625, |
|
"eval_ORGANIZATION_recall": 0.7692307692307693, |
|
"eval_PERSON_f1": 0.8745980707395499, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.84472049689441, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.17594219744205475, |
|
"eval_overall_accuracy": 0.9551406401551892, |
|
"eval_overall_f1": 0.8075370121130553, |
|
"eval_overall_precision": 0.7575757575757576, |
|
"eval_overall_recall": 0.8645533141210374, |
|
"eval_runtime": 0.3854, |
|
"eval_samples_per_second": 485.269, |
|
"eval_steps_per_second": 7.785, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 0.9806845784187317, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0435, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.8025477707006369, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7325581395348837, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7567567567567568, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6746987951807228, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18336325883865356, |
|
"eval_overall_accuracy": 0.9556256062075654, |
|
"eval_overall_f1": 0.8273092369477911, |
|
"eval_overall_precision": 0.7725, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.387, |
|
"eval_samples_per_second": 483.258, |
|
"eval_steps_per_second": 7.753, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 0.8235753178596497, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.0441, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7307692307692307, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6263736263736264, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1896522045135498, |
|
"eval_overall_accuracy": 0.9546556741028128, |
|
"eval_overall_f1": 0.8249336870026525, |
|
"eval_overall_precision": 0.7641277641277642, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3882, |
|
"eval_samples_per_second": 481.674, |
|
"eval_steps_per_second": 7.727, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 0.6915778517723083, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.042, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.782051282051282, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7402597402597403, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6404494382022472, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18752093613147736, |
|
"eval_overall_accuracy": 0.9539282250242483, |
|
"eval_overall_f1": 0.8196286472148541, |
|
"eval_overall_precision": 0.7592137592137592, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3905, |
|
"eval_samples_per_second": 478.818, |
|
"eval_steps_per_second": 7.682, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 0.8931111097335815, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0414, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6923076923076923, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5934065934065934, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6842105263157895, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6046511627906976, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18678565323352814, |
|
"eval_overall_accuracy": 0.9544131910766246, |
|
"eval_overall_f1": 0.8031496062992126, |
|
"eval_overall_precision": 0.7373493975903614, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3856, |
|
"eval_samples_per_second": 485.009, |
|
"eval_steps_per_second": 7.781, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 0.4860210418701172, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.0408, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7152317880794703, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.627906976744186, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.732394366197183, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6842105263157895, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.17208231985569, |
|
"eval_overall_accuracy": 0.9556256062075654, |
|
"eval_overall_f1": 0.8161073825503355, |
|
"eval_overall_precision": 0.7638190954773869, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3889, |
|
"eval_samples_per_second": 480.88, |
|
"eval_steps_per_second": 7.715, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 0.5651527047157288, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.0388, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7222222222222222, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6582278481012658, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7123287671232875, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.65, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.18390165269374847, |
|
"eval_overall_accuracy": 0.9565955383123181, |
|
"eval_overall_f1": 0.8178137651821863, |
|
"eval_overall_precision": 0.7690355329949239, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.3888, |
|
"eval_samples_per_second": 481.0, |
|
"eval_steps_per_second": 7.717, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 0.2999099791049957, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.039, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.7894736842105262, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7407407407407407, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7006369426751592, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5978260869565217, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7123287671232875, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.65, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.17726965248584747, |
|
"eval_overall_accuracy": 0.9527158098933075, |
|
"eval_overall_f1": 0.8095872170439414, |
|
"eval_overall_precision": 0.7524752475247525, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3872, |
|
"eval_samples_per_second": 482.921, |
|
"eval_steps_per_second": 7.747, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 0.43868881464004517, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.0414, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7297297297297298, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6506024096385542, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8774193548387097, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.16531790792942047, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8184281842818427, |
|
"eval_overall_precision": 0.7723785166240409, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.3889, |
|
"eval_samples_per_second": 480.89, |
|
"eval_steps_per_second": 7.715, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 0.5318551659584045, |
|
"learning_rate": 2e-05, |
|
"loss": 0.0379, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.7808219178082192, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.76, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.7172413793103448, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.65, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7605633802816901, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7105263157894737, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1694074124097824, |
|
"eval_overall_accuracy": 0.9561105722599418, |
|
"eval_overall_f1": 0.8142076502732241, |
|
"eval_overall_precision": 0.7740259740259741, |
|
"eval_overall_recall": 0.8587896253602305, |
|
"eval_runtime": 0.3853, |
|
"eval_samples_per_second": 485.37, |
|
"eval_steps_per_second": 7.787, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 1.2059674263000488, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.0391, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7058823529411765, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6136363636363636, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7123287671232875, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.65, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1873074322938919, |
|
"eval_overall_accuracy": 0.9551406401551892, |
|
"eval_overall_f1": 0.8138297872340426, |
|
"eval_overall_precision": 0.7555555555555555, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.393, |
|
"eval_samples_per_second": 475.865, |
|
"eval_steps_per_second": 7.634, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 0.812824010848999, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.0372, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7248322147651007, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6428571428571429, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8774193548387097, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.17852064967155457, |
|
"eval_overall_accuracy": 0.9558680892337537, |
|
"eval_overall_f1": 0.8176943699731903, |
|
"eval_overall_precision": 0.7644110275689223, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3865, |
|
"eval_samples_per_second": 483.888, |
|
"eval_steps_per_second": 7.763, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 0.8590715527534485, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0371, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.738255033557047, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6547619047619048, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7605633802816901, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7105263157894737, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.17511434853076935, |
|
"eval_overall_accuracy": 0.9568380213385063, |
|
"eval_overall_f1": 0.8232118758434548, |
|
"eval_overall_precision": 0.7741116751269036, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3898, |
|
"eval_samples_per_second": 479.785, |
|
"eval_steps_per_second": 7.697, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 0.4557998478412628, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0348, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7248322147651007, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6428571428571429, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7714285714285715, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7297297297297297, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1811322569847107, |
|
"eval_overall_accuracy": 0.9561105722599418, |
|
"eval_overall_f1": 0.825268817204301, |
|
"eval_overall_precision": 0.7732997481108312, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3884, |
|
"eval_samples_per_second": 481.467, |
|
"eval_steps_per_second": 7.724, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 0.6341075897216797, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0338, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7417218543046358, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6511627906976745, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1845623105764389, |
|
"eval_overall_accuracy": 0.9561105722599418, |
|
"eval_overall_f1": 0.8203753351206434, |
|
"eval_overall_precision": 0.7669172932330827, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3877, |
|
"eval_samples_per_second": 482.316, |
|
"eval_steps_per_second": 7.738, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 0.8572676777839661, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.033, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.7848101265822784, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7126436781609196, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.728476821192053, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6395348837209303, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1916947364807129, |
|
"eval_overall_accuracy": 0.9553831231813773, |
|
"eval_overall_f1": 0.8207171314741034, |
|
"eval_overall_precision": 0.7610837438423645, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3895, |
|
"eval_samples_per_second": 480.163, |
|
"eval_steps_per_second": 7.703, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 0.2351032942533493, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0347, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.8079470198675496, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7625, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7019867549668873, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6162790697674418, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7605633802816901, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7105263157894737, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18072670698165894, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8189189189189189, |
|
"eval_overall_precision": 0.7709923664122137, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.3888, |
|
"eval_samples_per_second": 481.006, |
|
"eval_steps_per_second": 7.717, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 0.4664683938026428, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.034, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.782051282051282, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.738255033557047, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6547619047619048, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8896103896103896, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8670886075949367, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1870609074831009, |
|
"eval_overall_accuracy": 0.9558680892337537, |
|
"eval_overall_f1": 0.8165997322623828, |
|
"eval_overall_precision": 0.7625, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3882, |
|
"eval_samples_per_second": 481.675, |
|
"eval_steps_per_second": 7.727, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 0.3841381072998047, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.0319, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.775, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6966292134831461, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.726027397260274, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.654320987654321, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7605633802816901, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7105263157894737, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18617138266563416, |
|
"eval_overall_accuracy": 0.954898157129001, |
|
"eval_overall_f1": 0.8181818181818181, |
|
"eval_overall_precision": 0.7630922693266833, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3893, |
|
"eval_samples_per_second": 480.405, |
|
"eval_steps_per_second": 7.707, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 0.48607921600341797, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.0338, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7199999999999999, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6352941176470588, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.896551724137931, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1894809454679489, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.824631860776439, |
|
"eval_overall_precision": 0.77, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3875, |
|
"eval_samples_per_second": 482.595, |
|
"eval_steps_per_second": 7.742, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 0.6728916168212891, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0306, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.728476821192053, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6395348837209303, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.20611025393009186, |
|
"eval_overall_accuracy": 0.9558680892337537, |
|
"eval_overall_f1": 0.8202396804260986, |
|
"eval_overall_precision": 0.7623762376237624, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3866, |
|
"eval_samples_per_second": 483.747, |
|
"eval_steps_per_second": 7.761, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 0.954484760761261, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0343, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.7721518987341772, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7011494252873564, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7417218543046358, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6511627906976745, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19823096692562103, |
|
"eval_overall_accuracy": 0.9541707080504365, |
|
"eval_overall_f1": 0.8202396804260986, |
|
"eval_overall_precision": 0.7623762376237624, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3914, |
|
"eval_samples_per_second": 477.758, |
|
"eval_steps_per_second": 7.665, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 0.27965471148490906, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0308, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.782051282051282, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7586206896551724, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6875, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.732394366197183, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6842105263157895, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19675639271736145, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.8247978436657682, |
|
"eval_overall_precision": 0.7746835443037975, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3896, |
|
"eval_samples_per_second": 480.01, |
|
"eval_steps_per_second": 7.701, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 1.283292531967163, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0328, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.7770700636942676, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7093023255813954, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.726027397260274, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.654320987654321, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19934506714344025, |
|
"eval_overall_accuracy": 0.95635305528613, |
|
"eval_overall_f1": 0.8172043010752689, |
|
"eval_overall_precision": 0.7657430730478589, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3876, |
|
"eval_samples_per_second": 482.397, |
|
"eval_steps_per_second": 7.739, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 1.0608142614364624, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0328, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.7741935483870968, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7142857142857143, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7333333333333334, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6470588235294118, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8867313915857605, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8616352201257862, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19247645139694214, |
|
"eval_overall_accuracy": 0.9558680892337537, |
|
"eval_overall_f1": 0.814516129032258, |
|
"eval_overall_precision": 0.7632241813602015, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.3884, |
|
"eval_samples_per_second": 481.515, |
|
"eval_steps_per_second": 7.725, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 0.5310276746749878, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0314, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.7631578947368421, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7160493827160493, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.738255033557047, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6547619047619048, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.732394366197183, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6842105263157895, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19101466238498688, |
|
"eval_overall_accuracy": 0.9553831231813773, |
|
"eval_overall_f1": 0.8151147098515519, |
|
"eval_overall_precision": 0.766497461928934, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.389, |
|
"eval_samples_per_second": 480.741, |
|
"eval_steps_per_second": 7.712, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 0.7759119868278503, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.0304, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.7721518987341772, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7011494252873564, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7027027027027027, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6265060240963856, |
|
"eval_ORGANIZATION_recall": 0.8, |
|
"eval_PERSON_f1": 0.8753993610223643, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8404907975460123, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19821016490459442, |
|
"eval_overall_accuracy": 0.9544131910766246, |
|
"eval_overall_f1": 0.8037383177570094, |
|
"eval_overall_precision": 0.7487562189054726, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.3876, |
|
"eval_samples_per_second": 482.51, |
|
"eval_steps_per_second": 7.741, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 0.5382179021835327, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.0318, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.7721518987341772, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7011494252873564, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7105263157894737, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6206896551724138, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6578947368421053, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5813953488372093, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.2088189721107483, |
|
"eval_overall_accuracy": 0.9527158098933075, |
|
"eval_overall_f1": 0.7994722955145119, |
|
"eval_overall_precision": 0.7372262773722628, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.3895, |
|
"eval_samples_per_second": 480.105, |
|
"eval_steps_per_second": 7.702, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 0.7348619103431702, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0303, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.7721518987341772, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7011494252873564, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.726027397260274, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.654320987654321, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.704225352112676, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.20289956033229828, |
|
"eval_overall_accuracy": 0.9539282250242483, |
|
"eval_overall_f1": 0.8074866310160428, |
|
"eval_overall_precision": 0.7531172069825436, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.392, |
|
"eval_samples_per_second": 476.992, |
|
"eval_steps_per_second": 7.652, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 0.42746540904045105, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0289, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.7682119205298014, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.725, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.7210884353741497, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6463414634146342, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6944444444444444, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6410256410256411, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.2005331665277481, |
|
"eval_overall_accuracy": 0.9539282250242483, |
|
"eval_overall_f1": 0.8032345013477089, |
|
"eval_overall_precision": 0.7544303797468355, |
|
"eval_overall_recall": 0.8587896253602305, |
|
"eval_runtime": 0.3897, |
|
"eval_samples_per_second": 479.848, |
|
"eval_steps_per_second": 7.698, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 0.303906112909317, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0283, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.7692307692307694, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7058823529411765, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7448275862068966, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.675, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.704225352112676, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.20049220323562622, |
|
"eval_overall_accuracy": 0.9558680892337537, |
|
"eval_overall_f1": 0.8113207547169812, |
|
"eval_overall_precision": 0.7620253164556962, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.3866, |
|
"eval_samples_per_second": 483.757, |
|
"eval_steps_per_second": 7.761, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 1.8275718688964844, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0303, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7333333333333334, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6470588235294118, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7142857142857142, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19804218411445618, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8167115902964959, |
|
"eval_overall_precision": 0.7670886075949367, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.3912, |
|
"eval_samples_per_second": 478.031, |
|
"eval_steps_per_second": 7.669, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 3.0445024967193604, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.0281, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.7843137254901961, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7317073170731707, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7346938775510204, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6585365853658537, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.704225352112676, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6578947368421053, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19731304049491882, |
|
"eval_overall_accuracy": 0.9551406401551892, |
|
"eval_overall_f1": 0.8113207547169812, |
|
"eval_overall_precision": 0.7620253164556962, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.3907, |
|
"eval_samples_per_second": 478.583, |
|
"eval_steps_per_second": 7.678, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 0.6099753379821777, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0281, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.7848101265822784, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7126436781609196, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7432432432432433, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6626506024096386, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7142857142857142, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.20074868202209473, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8165997322623828, |
|
"eval_overall_precision": 0.7625, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3897, |
|
"eval_samples_per_second": 479.814, |
|
"eval_steps_per_second": 7.698, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 0.7372535467147827, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0291, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.7692307692307694, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7058823529411765, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.738255033557047, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6547619047619048, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7142857142857142, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6756756756756757, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.20446744561195374, |
|
"eval_overall_accuracy": 0.9553831231813773, |
|
"eval_overall_f1": 0.8123324396782842, |
|
"eval_overall_precision": 0.7593984962406015, |
|
"eval_overall_recall": 0.8731988472622478, |
|
"eval_runtime": 0.3955, |
|
"eval_samples_per_second": 472.842, |
|
"eval_steps_per_second": 7.586, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 0.5419071316719055, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0286, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7466666666666668, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6588235294117647, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19124767184257507, |
|
"eval_overall_accuracy": 0.9587778855480117, |
|
"eval_overall_f1": 0.8247978436657682, |
|
"eval_overall_precision": 0.7746835443037975, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3984, |
|
"eval_samples_per_second": 469.353, |
|
"eval_steps_per_second": 7.53, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 1.295188546180725, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0267, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.782051282051282, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7466666666666668, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6588235294117647, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1960640400648117, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.8241610738255033, |
|
"eval_overall_precision": 0.7713567839195979, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3949, |
|
"eval_samples_per_second": 473.507, |
|
"eval_steps_per_second": 7.596, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 0.27405989170074463, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0282, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.782051282051282, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7567567567567568, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6746987951807228, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8867313915857605, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8616352201257862, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6849315068493151, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.625, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19417804479599, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8150134048257373, |
|
"eval_overall_precision": 0.7619047619047619, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3924, |
|
"eval_samples_per_second": 476.565, |
|
"eval_steps_per_second": 7.645, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 0.466235876083374, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0251, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7619047619047619, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6829268292682927, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6849315068493151, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.625, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.2023736834526062, |
|
"eval_overall_accuracy": 0.95635305528613, |
|
"eval_overall_f1": 0.8203753351206434, |
|
"eval_overall_precision": 0.7669172932330827, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3932, |
|
"eval_samples_per_second": 475.644, |
|
"eval_steps_per_second": 7.631, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 0.620521068572998, |
|
"learning_rate": 5e-06, |
|
"loss": 0.027, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7567567567567568, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6746987951807228, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7714285714285715, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7297297297297297, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19653601944446564, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8297297297297298, |
|
"eval_overall_precision": 0.7811704834605598, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3926, |
|
"eval_samples_per_second": 476.265, |
|
"eval_steps_per_second": 7.641, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 1.394244909286499, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0268, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.7741935483870968, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7142857142857143, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7567567567567568, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6746987951807228, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7605633802816901, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7105263157894737, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.2078668475151062, |
|
"eval_overall_accuracy": 0.9561105722599418, |
|
"eval_overall_f1": 0.8236877523553162, |
|
"eval_overall_precision": 0.7727272727272727, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3926, |
|
"eval_samples_per_second": 476.299, |
|
"eval_steps_per_second": 7.641, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 0.33064666390419006, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.0256, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7466666666666668, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6588235294117647, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19762425124645233, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8257372654155496, |
|
"eval_overall_precision": 0.7719298245614035, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3911, |
|
"eval_samples_per_second": 478.123, |
|
"eval_steps_per_second": 7.67, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 0.47633665800094604, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.0258, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7417218543046358, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6511627906976745, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1961781531572342, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8214765100671141, |
|
"eval_overall_precision": 0.7688442211055276, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3912, |
|
"eval_samples_per_second": 478.005, |
|
"eval_steps_per_second": 7.669, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 0.8689398169517517, |
|
"learning_rate": 3e-06, |
|
"loss": 0.0233, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7466666666666668, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6588235294117647, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19755157828330994, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8214765100671141, |
|
"eval_overall_precision": 0.7688442211055276, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3938, |
|
"eval_samples_per_second": 474.89, |
|
"eval_steps_per_second": 7.619, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 0.12069670855998993, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0259, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7482993197278912, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6707317073170732, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19969353079795837, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8221024258760108, |
|
"eval_overall_precision": 0.7721518987341772, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3908, |
|
"eval_samples_per_second": 478.563, |
|
"eval_steps_per_second": 7.677, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 0.6587622761726379, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0253, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.782051282051282, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7516778523489933, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.20329639315605164, |
|
"eval_overall_accuracy": 0.95635305528613, |
|
"eval_overall_f1": 0.8203753351206434, |
|
"eval_overall_precision": 0.7669172932330827, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.391, |
|
"eval_samples_per_second": 478.228, |
|
"eval_steps_per_second": 7.672, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 0.5734129548072815, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.0251, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.7870967741935485, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7516778523489933, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.20106351375579834, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.8225806451612904, |
|
"eval_overall_precision": 0.7707808564231738, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3918, |
|
"eval_samples_per_second": 477.341, |
|
"eval_steps_per_second": 7.658, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 0.6452818512916565, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0237, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.7948717948717949, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7294117647058823, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7417218543046358, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6511627906976745, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.20484283566474915, |
|
"eval_overall_accuracy": 0.9565955383123181, |
|
"eval_overall_f1": 0.823529411764706, |
|
"eval_overall_precision": 0.7680798004987531, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3905, |
|
"eval_samples_per_second": 478.82, |
|
"eval_steps_per_second": 7.682, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 0.052759163081645966, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.024, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7516778523489933, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.20229747891426086, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.8268456375838926, |
|
"eval_overall_precision": 0.7738693467336684, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3938, |
|
"eval_samples_per_second": 474.901, |
|
"eval_steps_per_second": 7.619, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 0.5731909871101379, |
|
"learning_rate": 0.0, |
|
"loss": 0.0257, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7567567567567568, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6746987951807228, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7428571428571429, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7027027027027027, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.2022850662469864, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.8279569892473119, |
|
"eval_overall_precision": 0.7758186397984886, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3925, |
|
"eval_samples_per_second": 476.464, |
|
"eval_steps_per_second": 7.644, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 10600, |
|
"total_flos": 5123217774191952.0, |
|
"train_loss": 0.07238403747666557, |
|
"train_runtime": 634.3549, |
|
"train_samples_per_second": 266.097, |
|
"train_steps_per_second": 16.71 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 10600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 5123217774191952.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|