|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 10600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 2.1874585151672363, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 1.0045, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.012121212121212121, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.06666666666666667, |
|
"eval_PERSON_recall": 0.006666666666666667, |
|
"eval_QUANTITY_f1": 0.0, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.0, |
|
"eval_QUANTITY_recall": 0.0, |
|
"eval_TIME_f1": 0.0, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.0, |
|
"eval_TIME_recall": 0.0, |
|
"eval_loss": 0.5767342448234558, |
|
"eval_overall_accuracy": 0.8433559650824443, |
|
"eval_overall_f1": 0.005434782608695652, |
|
"eval_overall_precision": 0.047619047619047616, |
|
"eval_overall_recall": 0.002881844380403458, |
|
"eval_runtime": 0.3512, |
|
"eval_samples_per_second": 532.399, |
|
"eval_steps_per_second": 8.541, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 1.000261664390564, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.4985, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.3859649122807017, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.5116279069767442, |
|
"eval_LOCATION_recall": 0.30985915492957744, |
|
"eval_ORGANIZATION_f1": 0.14184397163120568, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.13157894736842105, |
|
"eval_ORGANIZATION_recall": 0.15384615384615385, |
|
"eval_PERSON_f1": 0.7315634218289085, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.656084656084656, |
|
"eval_PERSON_recall": 0.8266666666666667, |
|
"eval_QUANTITY_f1": 0.15625, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.16129032258064516, |
|
"eval_QUANTITY_recall": 0.15151515151515152, |
|
"eval_TIME_f1": 0.7, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.65625, |
|
"eval_TIME_recall": 0.75, |
|
"eval_loss": 0.34785470366477966, |
|
"eval_overall_accuracy": 0.9083414161008729, |
|
"eval_overall_f1": 0.5069637883008357, |
|
"eval_overall_precision": 0.49056603773584906, |
|
"eval_overall_recall": 0.5244956772334294, |
|
"eval_runtime": 0.3485, |
|
"eval_samples_per_second": 536.657, |
|
"eval_steps_per_second": 8.609, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 0.8842161297798157, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.2936, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.6119402985074627, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6507936507936508, |
|
"eval_LOCATION_recall": 0.5774647887323944, |
|
"eval_ORGANIZATION_f1": 0.4255319148936171, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.39473684210526316, |
|
"eval_ORGANIZATION_recall": 0.46153846153846156, |
|
"eval_PERSON_f1": 0.8238993710691823, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7797619047619048, |
|
"eval_PERSON_recall": 0.8733333333333333, |
|
"eval_QUANTITY_f1": 0.5866666666666667, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5238095238095238, |
|
"eval_QUANTITY_recall": 0.6666666666666666, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.2019408941268921, |
|
"eval_overall_accuracy": 0.9340446168768186, |
|
"eval_overall_f1": 0.6850828729281768, |
|
"eval_overall_precision": 0.6578249336870027, |
|
"eval_overall_recall": 0.7146974063400576, |
|
"eval_runtime": 0.3515, |
|
"eval_samples_per_second": 531.999, |
|
"eval_steps_per_second": 8.535, |
|
"step": 318 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 1.0422954559326172, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.2113, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.6666666666666667, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.611764705882353, |
|
"eval_LOCATION_recall": 0.7323943661971831, |
|
"eval_ORGANIZATION_f1": 0.6583850931677019, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5520833333333334, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8473520249221183, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7953216374269005, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7012987012987013, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1662513017654419, |
|
"eval_overall_accuracy": 0.9459262851600388, |
|
"eval_overall_f1": 0.7574578469520102, |
|
"eval_overall_precision": 0.6886792452830188, |
|
"eval_overall_recall": 0.8414985590778098, |
|
"eval_runtime": 0.3504, |
|
"eval_samples_per_second": 533.64, |
|
"eval_steps_per_second": 8.561, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 1.0871312618255615, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.1824, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.6951219512195121, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6129032258064516, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.6580645161290322, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5666666666666667, |
|
"eval_ORGANIZATION_recall": 0.7846153846153846, |
|
"eval_PERSON_f1": 0.8607594936708859, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8192771084337349, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7088607594936709, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6086956521739131, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.75, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6666666666666666, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.15956708788871765, |
|
"eval_overall_accuracy": 0.944713870029098, |
|
"eval_overall_f1": 0.7609254498714653, |
|
"eval_overall_precision": 0.6867749419953596, |
|
"eval_overall_recall": 0.8530259365994236, |
|
"eval_runtime": 0.3507, |
|
"eval_samples_per_second": 533.247, |
|
"eval_steps_per_second": 8.555, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 1.1978598833084106, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.1647, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.6946107784431137, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6041666666666666, |
|
"eval_LOCATION_recall": 0.8169014084507042, |
|
"eval_ORGANIZATION_f1": 0.651685393258427, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5132743362831859, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8404907975460122, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.7784090909090909, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.6588235294117647, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5384615384615384, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.7164179104477612, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.6153846153846154, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.1713540256023407, |
|
"eval_overall_accuracy": 0.9369544131910766, |
|
"eval_overall_f1": 0.741190765492102, |
|
"eval_overall_precision": 0.6407563025210085, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3521, |
|
"eval_samples_per_second": 531.071, |
|
"eval_steps_per_second": 8.52, |
|
"step": 636 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 1.5508997440338135, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.1533, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.6993865030674846, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6195652173913043, |
|
"eval_LOCATION_recall": 0.8028169014084507, |
|
"eval_ORGANIZATION_f1": 0.6790123456790124, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5670103092783505, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8598130841121495, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8070175438596491, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.806451612903226, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7352941176470589, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14624279737472534, |
|
"eval_overall_accuracy": 0.9510184287099903, |
|
"eval_overall_f1": 0.770408163265306, |
|
"eval_overall_precision": 0.6910755148741419, |
|
"eval_overall_recall": 0.8703170028818443, |
|
"eval_runtime": 0.3512, |
|
"eval_samples_per_second": 532.397, |
|
"eval_steps_per_second": 8.541, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 0.8642424941062927, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.1405, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.7407407407407407, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6593406593406593, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.6783625730994152, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5471698113207547, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8717948717948718, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8395061728395061, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.736842105263158, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6511627906976745, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13807082176208496, |
|
"eval_overall_accuracy": 0.950533462657614, |
|
"eval_overall_f1": 0.7861715749039692, |
|
"eval_overall_precision": 0.7073732718894009, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3504, |
|
"eval_samples_per_second": 533.624, |
|
"eval_steps_per_second": 8.561, |
|
"step": 848 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 1.233667254447937, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.1341, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.7741935483870968, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7142857142857143, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.6785714285714285, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5533980582524272, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8562091503267975, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8397435897435898, |
|
"eval_PERSON_recall": 0.8733333333333333, |
|
"eval_QUANTITY_f1": 0.7466666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13261349499225616, |
|
"eval_overall_accuracy": 0.9495635305528612, |
|
"eval_overall_f1": 0.7869281045751635, |
|
"eval_overall_precision": 0.7200956937799043, |
|
"eval_overall_recall": 0.8674351585014409, |
|
"eval_runtime": 0.3537, |
|
"eval_samples_per_second": 528.626, |
|
"eval_steps_per_second": 8.481, |
|
"step": 954 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 1.0353517532348633, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.1274, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7096774193548387, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6111111111111112, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7297297297297297, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1223028227686882, |
|
"eval_overall_accuracy": 0.9590203685741998, |
|
"eval_overall_f1": 0.8191489361702129, |
|
"eval_overall_precision": 0.7604938271604939, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3511, |
|
"eval_samples_per_second": 532.631, |
|
"eval_steps_per_second": 8.545, |
|
"step": 1060 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 0.7219051122665405, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.1232, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7204968944099378, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6041666666666666, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7012987012987013, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1300116926431656, |
|
"eval_overall_accuracy": 0.9529582929194956, |
|
"eval_overall_f1": 0.8083989501312335, |
|
"eval_overall_precision": 0.7421686746987952, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3501, |
|
"eval_samples_per_second": 534.192, |
|
"eval_steps_per_second": 8.57, |
|
"step": 1166 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 1.0894474983215332, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.1195, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.728395061728395, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6483516483516484, |
|
"eval_LOCATION_recall": 0.8309859154929577, |
|
"eval_ORGANIZATION_f1": 0.6909090909090909, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.57, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7297297297297297, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.7999999999999999, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.75, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14111082255840302, |
|
"eval_overall_accuracy": 0.9522308438409312, |
|
"eval_overall_f1": 0.7917205692108668, |
|
"eval_overall_precision": 0.7183098591549296, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3502, |
|
"eval_samples_per_second": 534.002, |
|
"eval_steps_per_second": 8.567, |
|
"step": 1272 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 0.5753965377807617, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.1138, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.8157894736842104, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7239263803680982, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6020408163265306, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.8838709677419355, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.85625, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.9259259259259259, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9615384615384616, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.12571823596954346, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8260292164674636, |
|
"eval_overall_precision": 0.7660098522167488, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3506, |
|
"eval_samples_per_second": 533.355, |
|
"eval_steps_per_second": 8.556, |
|
"step": 1378 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 1.7395552396774292, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.1106, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.7973856209150327, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7439024390243902, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7160493827160493, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5979381443298969, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7088607594936709, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6086956521739131, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1278010457754135, |
|
"eval_overall_accuracy": 0.9541707080504365, |
|
"eval_overall_f1": 0.8104575163398693, |
|
"eval_overall_precision": 0.7416267942583732, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3503, |
|
"eval_samples_per_second": 533.795, |
|
"eval_steps_per_second": 8.564, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 1.1085916757583618, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.1037, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7375, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6210526315789474, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.8974358974358974, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.691358024691358, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5833333333333334, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1332232654094696, |
|
"eval_overall_accuracy": 0.953443258971872, |
|
"eval_overall_f1": 0.81877444589309, |
|
"eval_overall_precision": 0.7476190476190476, |
|
"eval_overall_recall": 0.9048991354466859, |
|
"eval_runtime": 0.3501, |
|
"eval_samples_per_second": 534.13, |
|
"eval_steps_per_second": 8.569, |
|
"step": 1590 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 1.2298065423965454, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.1015, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.7870967741935485, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7453416149068324, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.625, |
|
"eval_ORGANIZATION_recall": 0.9230769230769231, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6506024096385542, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.54, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13960066437721252, |
|
"eval_overall_accuracy": 0.9539282250242483, |
|
"eval_overall_f1": 0.811443433029909, |
|
"eval_overall_precision": 0.7393364928909952, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3495, |
|
"eval_samples_per_second": 535.049, |
|
"eval_steps_per_second": 8.584, |
|
"step": 1696 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 0.7031758427619934, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.0958, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.728395061728395, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6082474226804123, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.90032154340836, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.12715467810630798, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8274044795783926, |
|
"eval_overall_precision": 0.7621359223300971, |
|
"eval_overall_recall": 0.9048991354466859, |
|
"eval_runtime": 0.3498, |
|
"eval_samples_per_second": 534.552, |
|
"eval_steps_per_second": 8.576, |
|
"step": 1802 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 0.8438174724578857, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.0957, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.782051282051282, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7017543859649122, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5660377358490566, |
|
"eval_ORGANIZATION_recall": 0.9230769230769231, |
|
"eval_PERSON_f1": 0.8945686900958466, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14869378507137299, |
|
"eval_overall_accuracy": 0.9527158098933075, |
|
"eval_overall_f1": 0.8067010309278351, |
|
"eval_overall_precision": 0.7296037296037297, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3502, |
|
"eval_samples_per_second": 534.029, |
|
"eval_steps_per_second": 8.567, |
|
"step": 1908 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 0.7291853427886963, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.0943, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7195121951219511, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5959595959595959, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.90032154340836, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.12535077333450317, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8258575197889182, |
|
"eval_overall_precision": 0.7615571776155717, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3513, |
|
"eval_samples_per_second": 532.375, |
|
"eval_steps_per_second": 8.541, |
|
"step": 2014 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 1.0950889587402344, |
|
"learning_rate": 4e-05, |
|
"loss": 0.0915, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7421383647798743, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6276595744680851, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.90032154340836, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7466666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.9259259259259259, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9615384615384616, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.12668967247009277, |
|
"eval_overall_accuracy": 0.9590203685741998, |
|
"eval_overall_f1": 0.8335552596537948, |
|
"eval_overall_precision": 0.7747524752475248, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3504, |
|
"eval_samples_per_second": 533.636, |
|
"eval_steps_per_second": 8.561, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 1.227335810661316, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.0834, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.7672955974842768, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6931818181818182, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7239263803680982, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6020408163265306, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6410256410256411, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5555555555555556, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.8928571428571429, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8928571428571429, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1432582437992096, |
|
"eval_overall_accuracy": 0.953443258971872, |
|
"eval_overall_f1": 0.8057366362451109, |
|
"eval_overall_precision": 0.7357142857142858, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3505, |
|
"eval_samples_per_second": 533.585, |
|
"eval_steps_per_second": 8.56, |
|
"step": 2226 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 0.8867971301078796, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.0839, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7329192546583851, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6145833333333334, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.6582278481012658, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5652173913043478, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8928571428571429, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8928571428571429, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14338690042495728, |
|
"eval_overall_accuracy": 0.9546556741028128, |
|
"eval_overall_f1": 0.8184210526315788, |
|
"eval_overall_precision": 0.7530266343825666, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3497, |
|
"eval_samples_per_second": 534.745, |
|
"eval_steps_per_second": 8.579, |
|
"step": 2332 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 1.0698140859603882, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.0807, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.782051282051282, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7176470588235294, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7195121951219511, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5959595959595959, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.912621359223301, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8867924528301887, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13598859310150146, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.8252299605781866, |
|
"eval_overall_precision": 0.7584541062801933, |
|
"eval_overall_recall": 0.9048991354466859, |
|
"eval_runtime": 0.3499, |
|
"eval_samples_per_second": 534.445, |
|
"eval_steps_per_second": 8.574, |
|
"step": 2438 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 0.7420476675033569, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.0771, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.7870967741935485, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7215189873417722, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6129032258064516, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9137380191693292, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8773006134969326, |
|
"eval_PERSON_recall": 0.9533333333333334, |
|
"eval_QUANTITY_f1": 0.6419753086419753, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5416666666666666, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8571428571428571, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8571428571428571, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14340347051620483, |
|
"eval_overall_accuracy": 0.9539282250242483, |
|
"eval_overall_f1": 0.8152031454783748, |
|
"eval_overall_precision": 0.7475961538461539, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3509, |
|
"eval_samples_per_second": 532.923, |
|
"eval_steps_per_second": 8.55, |
|
"step": 2544 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 1.0963969230651855, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.0772, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.7770700636942676, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7093023255813954, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7065868263473054, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5784313725490197, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.90032154340836, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.6428571428571428, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5294117647058824, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1520393043756485, |
|
"eval_overall_accuracy": 0.9502909796314258, |
|
"eval_overall_f1": 0.8010269576379975, |
|
"eval_overall_precision": 0.7222222222222222, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3508, |
|
"eval_samples_per_second": 533.007, |
|
"eval_steps_per_second": 8.551, |
|
"step": 2650 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 0.38709110021591187, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.0732, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.7741935483870968, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7142857142857143, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7499999999999999, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.631578947368421, |
|
"eval_ORGANIZATION_recall": 0.9230769230769231, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.9259259259259259, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.9615384615384616, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14221937954425812, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8243064729194188, |
|
"eval_overall_precision": 0.7609756097560976, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3493, |
|
"eval_samples_per_second": 535.398, |
|
"eval_steps_per_second": 8.589, |
|
"step": 2756 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 0.5424766540527344, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.0731, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7564102564102564, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6483516483516484, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.65, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5531914893617021, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8524590163934426, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7878787878787878, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.13665592670440674, |
|
"eval_overall_accuracy": 0.9556256062075654, |
|
"eval_overall_f1": 0.8184210526315788, |
|
"eval_overall_precision": 0.7530266343825666, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3499, |
|
"eval_samples_per_second": 534.475, |
|
"eval_steps_per_second": 8.574, |
|
"step": 2862 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 2.6486599445343018, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.0697, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.8026315789473684, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7530864197530864, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7160493827160493, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5979381443298969, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.9142857142857144, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8727272727272727, |
|
"eval_PERSON_recall": 0.96, |
|
"eval_QUANTITY_f1": 0.6329113924050633, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5434782608695652, |
|
"eval_QUANTITY_recall": 0.7575757575757576, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14497701823711395, |
|
"eval_overall_accuracy": 0.954898157129001, |
|
"eval_overall_f1": 0.8151041666666666, |
|
"eval_overall_precision": 0.7434679334916865, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3505, |
|
"eval_samples_per_second": 533.595, |
|
"eval_steps_per_second": 8.56, |
|
"step": 2968 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 0.7765714526176453, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.0689, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7085714285714286, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5636363636363636, |
|
"eval_ORGANIZATION_recall": 0.9538461538461539, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.7936507936507937, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7142857142857143, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.15288624167442322, |
|
"eval_overall_accuracy": 0.9553831231813773, |
|
"eval_overall_f1": 0.8097686375321336, |
|
"eval_overall_precision": 0.7308584686774942, |
|
"eval_overall_recall": 0.9077809798270894, |
|
"eval_runtime": 0.3501, |
|
"eval_samples_per_second": 534.16, |
|
"eval_steps_per_second": 8.569, |
|
"step": 3074 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 0.8394734263420105, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.0669, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.7870967741935485, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7421383647798743, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6276595744680851, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.736842105263158, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6511627906976745, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8135593220338982, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7741935483870968, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14122405648231506, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8157894736842105, |
|
"eval_overall_precision": 0.7506053268765133, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3503, |
|
"eval_samples_per_second": 533.82, |
|
"eval_steps_per_second": 8.564, |
|
"step": 3180 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 0.43885117769241333, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.0654, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.779874213836478, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7045454545454546, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7741935483870968, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6666666666666666, |
|
"eval_ORGANIZATION_recall": 0.9230769230769231, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.13700760900974274, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8227513227513227, |
|
"eval_overall_precision": 0.7603911980440098, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3506, |
|
"eval_samples_per_second": 533.416, |
|
"eval_steps_per_second": 8.557, |
|
"step": 3286 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 0.3841339647769928, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.0639, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7108433734939759, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5841584158415841, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7012987012987013, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14966341853141785, |
|
"eval_overall_accuracy": 0.9561105722599418, |
|
"eval_overall_f1": 0.81151832460733, |
|
"eval_overall_precision": 0.7434052757793765, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3501, |
|
"eval_samples_per_second": 534.13, |
|
"eval_steps_per_second": 8.569, |
|
"step": 3392 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 0.86671382188797, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.0637, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7297297297297298, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6506024096385542, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.9009584664536742, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8650306748466258, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7297297297297297, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.7868852459016394, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7272727272727273, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.13783931732177734, |
|
"eval_overall_accuracy": 0.9597478176527643, |
|
"eval_overall_f1": 0.8213333333333332, |
|
"eval_overall_precision": 0.7642679900744417, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3499, |
|
"eval_samples_per_second": 534.488, |
|
"eval_steps_per_second": 8.575, |
|
"step": 3498 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 0.8965917229652405, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.0625, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.8181818181818181, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7590361445783133, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.759493670886076, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6451612903225806, |
|
"eval_ORGANIZATION_recall": 0.9230769230769231, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7297297297297297, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.14487268030643463, |
|
"eval_overall_accuracy": 0.9587778855480117, |
|
"eval_overall_f1": 0.8333333333333334, |
|
"eval_overall_precision": 0.7701711491442543, |
|
"eval_overall_recall": 0.9077809798270894, |
|
"eval_runtime": 0.3507, |
|
"eval_samples_per_second": 533.265, |
|
"eval_steps_per_second": 8.555, |
|
"step": 3604 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 0.7054619193077087, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.0634, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.7898089171974522, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7209302325581395, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7483870967741936, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6444444444444445, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7012987012987013, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.896551724137931, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.14537405967712402, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.821664464993395, |
|
"eval_overall_precision": 0.7585365853658537, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.35, |
|
"eval_samples_per_second": 534.224, |
|
"eval_steps_per_second": 8.57, |
|
"step": 3710 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 0.9769655466079712, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.0592, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7672955974842768, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.648936170212766, |
|
"eval_ORGANIZATION_recall": 0.9384615384615385, |
|
"eval_PERSON_f1": 0.9067524115755627, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8757763975155279, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8387096774193549, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1611613929271698, |
|
"eval_overall_accuracy": 0.9561105722599418, |
|
"eval_overall_f1": 0.8298429319371728, |
|
"eval_overall_precision": 0.7601918465227818, |
|
"eval_overall_recall": 0.9135446685878963, |
|
"eval_runtime": 0.3514, |
|
"eval_samples_per_second": 532.12, |
|
"eval_steps_per_second": 8.537, |
|
"step": 3816 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 0.828741192817688, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.0597, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.7643312101910827, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.6976744186046512, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7439024390243902, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6161616161616161, |
|
"eval_ORGANIZATION_recall": 0.9384615384615385, |
|
"eval_PERSON_f1": 0.8974358974358974, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8641975308641975, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.6666666666666666, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5777777777777777, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1625693291425705, |
|
"eval_overall_accuracy": 0.953443258971872, |
|
"eval_overall_f1": 0.8093385214007783, |
|
"eval_overall_precision": 0.7358490566037735, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3504, |
|
"eval_samples_per_second": 533.713, |
|
"eval_steps_per_second": 8.562, |
|
"step": 3922 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 1.4891364574432373, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.0573, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7297297297297298, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6506024096385542, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8859934853420196, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8662420382165605, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7027027027027027, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6341463414634146, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8524590163934426, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7878787878787878, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1448131501674652, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8172043010752689, |
|
"eval_overall_precision": 0.7657430730478589, |
|
"eval_overall_recall": 0.8760806916426513, |
|
"eval_runtime": 0.3501, |
|
"eval_samples_per_second": 534.187, |
|
"eval_steps_per_second": 8.57, |
|
"step": 4028 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 0.5322253704071045, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.0561, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.7870967741935485, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7261904761904762, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7643312101910829, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6521739130434783, |
|
"eval_ORGANIZATION_recall": 0.9230769230769231, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7297297297297297, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14745843410491943, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8243064729194188, |
|
"eval_overall_precision": 0.7609756097560976, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3508, |
|
"eval_samples_per_second": 533.023, |
|
"eval_steps_per_second": 8.551, |
|
"step": 4134 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 1.2674453258514404, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0521, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7169811320754718, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6063829787234043, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8932038834951457, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8679245283018868, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7222222222222221, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6666666666666666, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.806451612903226, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7352941176470589, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14856770634651184, |
|
"eval_overall_accuracy": 0.9587778855480117, |
|
"eval_overall_f1": 0.8158940397350992, |
|
"eval_overall_precision": 0.7549019607843137, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3497, |
|
"eval_samples_per_second": 534.717, |
|
"eval_steps_per_second": 8.578, |
|
"step": 4240 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 0.23710742592811584, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.0526, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.7792207792207793, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7228915662650602, |
|
"eval_LOCATION_recall": 0.8450704225352113, |
|
"eval_ORGANIZATION_f1": 0.7272727272727274, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.9230769230769231, |
|
"eval_PERSON_f1": 0.8846153846153846, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8518518518518519, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7272727272727273, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6363636363636364, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.15941469371318817, |
|
"eval_overall_accuracy": 0.9561105722599418, |
|
"eval_overall_f1": 0.8135593220338984, |
|
"eval_overall_precision": 0.7428571428571429, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3497, |
|
"eval_samples_per_second": 534.713, |
|
"eval_steps_per_second": 8.578, |
|
"step": 4346 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 0.5749427080154419, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.0505, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.8533333333333334, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7297297297297298, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6506024096385542, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8387096774193549, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1528312712907791, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8317631224764469, |
|
"eval_overall_precision": 0.7803030303030303, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3505, |
|
"eval_samples_per_second": 533.466, |
|
"eval_steps_per_second": 8.558, |
|
"step": 4452 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 0.5371730923652649, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.0497, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.7721518987341772, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7011494252873564, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7006369426751592, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5978260869565217, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7297297297297297, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8387096774193549, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.14798860251903534, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.8068331143232589, |
|
"eval_overall_precision": 0.7415458937198067, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3497, |
|
"eval_samples_per_second": 534.734, |
|
"eval_steps_per_second": 8.579, |
|
"step": 4558 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 0.9185490608215332, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.0525, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7529411764705882, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7320261437908497, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6363636363636364, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.90032154340836, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.6933333333333334, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6190476190476191, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8387096774193549, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.15042471885681152, |
|
"eval_overall_accuracy": 0.9602327837051406, |
|
"eval_overall_f1": 0.8243064729194188, |
|
"eval_overall_precision": 0.7609756097560976, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3507, |
|
"eval_samples_per_second": 533.267, |
|
"eval_steps_per_second": 8.555, |
|
"step": 4664 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 1.4481260776519775, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.0486, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.8289473684210527, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7777777777777778, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7236842105263158, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.632183908045977, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8996763754045306, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8742138364779874, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.896551724137931, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.14780230820178986, |
|
"eval_overall_accuracy": 0.9614451988360815, |
|
"eval_overall_f1": 0.8360215053763441, |
|
"eval_overall_precision": 0.783375314861461, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3493, |
|
"eval_samples_per_second": 535.387, |
|
"eval_steps_per_second": 8.589, |
|
"step": 4770 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 0.6384713053703308, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.0454, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.8311688311688312, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7272727272727273, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6292134831460674, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9155844155844156, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.732394366197183, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6842105263157895, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.819672131147541, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7575757575757576, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.14535315334796906, |
|
"eval_overall_accuracy": 0.9626576139670223, |
|
"eval_overall_f1": 0.8342245989304813, |
|
"eval_overall_precision": 0.7780548628428927, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3518, |
|
"eval_samples_per_second": 531.582, |
|
"eval_steps_per_second": 8.528, |
|
"step": 4876 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 3.3819124698638916, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.049, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.7922077922077921, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7349397590361446, |
|
"eval_LOCATION_recall": 0.8591549295774648, |
|
"eval_ORGANIZATION_f1": 0.7108433734939759, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5841584158415841, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.15948139131069183, |
|
"eval_overall_accuracy": 0.9551406401551892, |
|
"eval_overall_f1": 0.8188976377952757, |
|
"eval_overall_precision": 0.7518072289156627, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3491, |
|
"eval_samples_per_second": 535.655, |
|
"eval_steps_per_second": 8.593, |
|
"step": 4982 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 0.692154049873352, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.0467, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7272727272727273, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6292134831460674, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.9090909090909091, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8860759493670886, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8275862068965518, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8, |
|
"eval_TIME_recall": 0.8571428571428571, |
|
"eval_loss": 0.14814431965351105, |
|
"eval_overall_accuracy": 0.9587778855480117, |
|
"eval_overall_f1": 0.8255659121171772, |
|
"eval_overall_precision": 0.7673267326732673, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.35, |
|
"eval_samples_per_second": 534.257, |
|
"eval_steps_per_second": 8.571, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 0.21525277197360992, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.0458, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7450980392156863, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6477272727272727, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9032258064516129, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.875, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7027027027027027, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6341463414634146, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.15645316243171692, |
|
"eval_overall_accuracy": 0.9592628516003879, |
|
"eval_overall_f1": 0.8293333333333333, |
|
"eval_overall_precision": 0.771712158808933, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3516, |
|
"eval_samples_per_second": 531.919, |
|
"eval_steps_per_second": 8.533, |
|
"step": 5194 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 0.6371389031410217, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0435, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.8258064516129031, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7619047619047619, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7105263157894737, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6206896551724138, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7297297297297297, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1588226705789566, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8266666666666667, |
|
"eval_overall_precision": 0.7692307692307693, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3498, |
|
"eval_samples_per_second": 534.657, |
|
"eval_steps_per_second": 8.577, |
|
"step": 5300 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 0.3768903613090515, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.0461, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.7974683544303797, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7241379310344828, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7044025157232704, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5957446808510638, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8524590163934426, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7878787878787878, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.16307169198989868, |
|
"eval_overall_accuracy": 0.9558680892337537, |
|
"eval_overall_f1": 0.8125819134993448, |
|
"eval_overall_precision": 0.7451923076923077, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3494, |
|
"eval_samples_per_second": 535.279, |
|
"eval_steps_per_second": 8.587, |
|
"step": 5406 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 0.7790448665618896, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0424, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.8051948051948051, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7469879518072289, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7215189873417722, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6129032258064516, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9155844155844156, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8924050632911392, |
|
"eval_PERSON_recall": 0.94, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.17204023897647858, |
|
"eval_overall_accuracy": 0.9565955383123181, |
|
"eval_overall_f1": 0.8302387267904509, |
|
"eval_overall_precision": 0.769041769041769, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3508, |
|
"eval_samples_per_second": 533.066, |
|
"eval_steps_per_second": 8.552, |
|
"step": 5512 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 0.5764625072479248, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.0436, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.8025477707006369, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7325581395348837, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7142857142857142, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5825242718446602, |
|
"eval_ORGANIZATION_recall": 0.9230769230769231, |
|
"eval_PERSON_f1": 0.9102564102564102, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8765432098765432, |
|
"eval_PERSON_recall": 0.9466666666666667, |
|
"eval_QUANTITY_f1": 0.7012987012987013, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8387096774193549, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7647058823529411, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1814979910850525, |
|
"eval_overall_accuracy": 0.9529582929194956, |
|
"eval_overall_f1": 0.8195876288659794, |
|
"eval_overall_precision": 0.7412587412587412, |
|
"eval_overall_recall": 0.9164265129682997, |
|
"eval_runtime": 0.3501, |
|
"eval_samples_per_second": 534.111, |
|
"eval_steps_per_second": 8.569, |
|
"step": 5618 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 0.7614324688911438, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.0414, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.823529411764706, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7682926829268293, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7354838709677419, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6333333333333333, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.896551724137931, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1521797627210617, |
|
"eval_overall_accuracy": 0.9602327837051406, |
|
"eval_overall_f1": 0.8315508021390374, |
|
"eval_overall_precision": 0.7755610972568578, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3503, |
|
"eval_samples_per_second": 533.843, |
|
"eval_steps_per_second": 8.564, |
|
"step": 5724 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 0.6456512212753296, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0413, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.8211920529801324, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.775, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7450980392156863, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6477272727272727, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.9019607843137256, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8846153846153846, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7297297297297297, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8771929824561403, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8620689655172413, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.15478459000587463, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.834008097165992, |
|
"eval_overall_precision": 0.7842639593908629, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3506, |
|
"eval_samples_per_second": 533.435, |
|
"eval_steps_per_second": 8.558, |
|
"step": 5830 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 1.6711740493774414, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.04, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.8496732026143791, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7926829268292683, |
|
"eval_LOCATION_recall": 0.9154929577464789, |
|
"eval_ORGANIZATION_f1": 0.728476821192053, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6395348837209303, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1626283824443817, |
|
"eval_overall_accuracy": 0.9592628516003879, |
|
"eval_overall_f1": 0.8337801608579088, |
|
"eval_overall_precision": 0.7794486215538847, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.35, |
|
"eval_samples_per_second": 534.232, |
|
"eval_steps_per_second": 8.571, |
|
"step": 5936 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 0.47535088658332825, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.0416, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.823529411764706, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7682926829268293, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7432432432432433, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6626506024096386, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.6923076923076923, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.912280701754386, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.896551724137931, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.16426201164722443, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8299866131191432, |
|
"eval_overall_precision": 0.775, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3497, |
|
"eval_samples_per_second": 534.703, |
|
"eval_steps_per_second": 8.578, |
|
"step": 6042 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 0.42809298634529114, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.0409, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.8421052631578947, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7901234567901234, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7272727272727273, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6292134831460674, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8917197452229298, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8536585365853658, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.6835443037974683, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.5869565217391305, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.896551724137931, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.15997961163520813, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8269484808454426, |
|
"eval_overall_precision": 0.7634146341463415, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3495, |
|
"eval_samples_per_second": 535.11, |
|
"eval_steps_per_second": 8.585, |
|
"step": 6148 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 1.3752318620681763, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.0392, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.8, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7380952380952381, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7297297297297298, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6506024096385542, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8831168831168831, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8607594936708861, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.912280701754386, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.896551724137931, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1547561138868332, |
|
"eval_overall_accuracy": 0.9599903006789525, |
|
"eval_overall_f1": 0.8232118758434548, |
|
"eval_overall_precision": 0.7741116751269036, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3499, |
|
"eval_samples_per_second": 534.45, |
|
"eval_steps_per_second": 8.574, |
|
"step": 6254 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 0.807634711265564, |
|
"learning_rate": 2e-05, |
|
"loss": 0.0374, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.8476821192052981, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.8, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7417218543046358, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6511627906976745, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8932038834951457, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8679245283018868, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8928571428571429, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8928571428571429, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.15809109807014465, |
|
"eval_overall_accuracy": 0.9609602327837051, |
|
"eval_overall_f1": 0.8394062078272604, |
|
"eval_overall_precision": 0.7893401015228426, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3505, |
|
"eval_samples_per_second": 533.596, |
|
"eval_steps_per_second": 8.56, |
|
"step": 6360 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 0.2931790351867676, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.0365, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.8421052631578947, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7901234567901234, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7515923566878981, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6413043478260869, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.912280701754386, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.896551724137931, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.16991622745990753, |
|
"eval_overall_accuracy": 0.9612027158098934, |
|
"eval_overall_f1": 0.8411214953271029, |
|
"eval_overall_precision": 0.7835820895522388, |
|
"eval_overall_recall": 0.9077809798270894, |
|
"eval_runtime": 0.3512, |
|
"eval_samples_per_second": 532.476, |
|
"eval_steps_per_second": 8.542, |
|
"step": 6466 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 0.6080542802810669, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.0367, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.8441558441558441, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7831325301204819, |
|
"eval_LOCATION_recall": 0.9154929577464789, |
|
"eval_ORGANIZATION_f1": 0.738255033557047, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6547619047619048, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8859934853420196, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8662420382165605, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7297297297297297, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1723637729883194, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8317631224764469, |
|
"eval_overall_precision": 0.7803030303030303, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3492, |
|
"eval_samples_per_second": 535.569, |
|
"eval_steps_per_second": 8.592, |
|
"step": 6572 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 0.6744797825813293, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0365, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.8289473684210527, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7777777777777778, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7169811320754718, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6063829787234043, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8802588996763754, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8553459119496856, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7671232876712328, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.16163378953933716, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.8244680851063829, |
|
"eval_overall_precision": 0.7654320987654321, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3516, |
|
"eval_samples_per_second": 531.858, |
|
"eval_steps_per_second": 8.532, |
|
"step": 6678 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 0.468826025724411, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0355, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.8129032258064516, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7534246575342466, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6790123456790124, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8817891373801918, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8466257668711656, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7012987012987013, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.17165683209896088, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.824, |
|
"eval_overall_precision": 0.7667493796526055, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3518, |
|
"eval_samples_per_second": 531.527, |
|
"eval_steps_per_second": 8.527, |
|
"step": 6784 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 1.1759960651397705, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0372, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.8258064516129031, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7619047619047619, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7320261437908497, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6363636363636364, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8938906752411575, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8633540372670807, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8666666666666666, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8125, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.16856727004051208, |
|
"eval_overall_accuracy": 0.9590203685741998, |
|
"eval_overall_f1": 0.8308921438082557, |
|
"eval_overall_precision": 0.7722772277227723, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3518, |
|
"eval_samples_per_second": 531.563, |
|
"eval_steps_per_second": 8.528, |
|
"step": 6890 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 0.6541854739189148, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.0362, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.728395061728395, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6082474226804123, |
|
"eval_ORGANIZATION_recall": 0.9076923076923077, |
|
"eval_PERSON_f1": 0.8945686900958466, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8588957055214724, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.18290750682353973, |
|
"eval_overall_accuracy": 0.9561105722599418, |
|
"eval_overall_f1": 0.8241469816272966, |
|
"eval_overall_precision": 0.7566265060240964, |
|
"eval_overall_recall": 0.9048991354466859, |
|
"eval_runtime": 0.3503, |
|
"eval_samples_per_second": 533.882, |
|
"eval_steps_per_second": 8.565, |
|
"step": 6996 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 0.5697064995765686, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.0333, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.823529411764706, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7682926829268293, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7388535031847134, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6304347826086957, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8996763754045306, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8742138364779874, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.17202883958816528, |
|
"eval_overall_accuracy": 0.9592628516003879, |
|
"eval_overall_f1": 0.8320000000000001, |
|
"eval_overall_precision": 0.7741935483870968, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3506, |
|
"eval_samples_per_second": 533.421, |
|
"eval_steps_per_second": 8.558, |
|
"step": 7102 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 0.7047253251075745, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.033, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.8258064516129031, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7619047619047619, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7307692307692307, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6263736263736264, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8910256410256411, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8580246913580247, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.912280701754386, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.896551724137931, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.16683901846408844, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.8313413014608233, |
|
"eval_overall_precision": 0.770935960591133, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3497, |
|
"eval_samples_per_second": 534.689, |
|
"eval_steps_per_second": 8.578, |
|
"step": 7208 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 0.8004153370857239, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.0333, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.8441558441558441, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7831325301204819, |
|
"eval_LOCATION_recall": 0.9154929577464789, |
|
"eval_ORGANIZATION_f1": 0.7261146496815286, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6195652173913043, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7500000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6923076923076923, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1638197898864746, |
|
"eval_overall_accuracy": 0.9604752667313288, |
|
"eval_overall_f1": 0.8351063829787235, |
|
"eval_overall_precision": 0.7753086419753087, |
|
"eval_overall_recall": 0.9048991354466859, |
|
"eval_runtime": 0.3527, |
|
"eval_samples_per_second": 530.148, |
|
"eval_steps_per_second": 8.505, |
|
"step": 7314 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 0.29508113861083984, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.0335, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.8496732026143791, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7926829268292683, |
|
"eval_LOCATION_recall": 0.9154929577464789, |
|
"eval_ORGANIZATION_f1": 0.75, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6551724137931034, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.17051611840724945, |
|
"eval_overall_accuracy": 0.9592628516003879, |
|
"eval_overall_f1": 0.8380187416331996, |
|
"eval_overall_precision": 0.7825, |
|
"eval_overall_recall": 0.9020172910662824, |
|
"eval_runtime": 0.3495, |
|
"eval_samples_per_second": 535.056, |
|
"eval_steps_per_second": 8.584, |
|
"step": 7420 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 1.538805365562439, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0353, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.8129032258064516, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7080745341614907, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.59375, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8917197452229298, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8536585365853658, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19078566133975983, |
|
"eval_overall_accuracy": 0.9544131910766246, |
|
"eval_overall_f1": 0.814621409921671, |
|
"eval_overall_precision": 0.7446300715990454, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3503, |
|
"eval_samples_per_second": 533.879, |
|
"eval_steps_per_second": 8.565, |
|
"step": 7526 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 0.9210314750671387, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0324, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.8129032258064516, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7236842105263158, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.632183908045977, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7945205479452054, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.725, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1728380173444748, |
|
"eval_overall_accuracy": 0.9602327837051406, |
|
"eval_overall_f1": 0.8277703604806409, |
|
"eval_overall_precision": 0.7711442786069652, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3513, |
|
"eval_samples_per_second": 532.244, |
|
"eval_steps_per_second": 8.539, |
|
"step": 7632 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 0.4661843776702881, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0323, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.8157894736842104, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7388535031847134, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6304347826086957, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.896551724137931, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8666666666666667, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.17989809811115265, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.8260292164674636, |
|
"eval_overall_precision": 0.7660098522167488, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3497, |
|
"eval_samples_per_second": 534.723, |
|
"eval_steps_per_second": 8.578, |
|
"step": 7738 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 1.6226832866668701, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0321, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.8344370860927152, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7320261437908497, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6363636363636364, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.896774193548387, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.86875, |
|
"eval_PERSON_recall": 0.9266666666666666, |
|
"eval_QUANTITY_f1": 0.7012987012987013, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6136363636363636, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8620689655172413, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8333333333333334, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1787552833557129, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.8277703604806409, |
|
"eval_overall_precision": 0.7711442786069652, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3512, |
|
"eval_samples_per_second": 532.488, |
|
"eval_steps_per_second": 8.543, |
|
"step": 7844 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 0.3848640024662018, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0296, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7320261437908497, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6363636363636364, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7837837837837839, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.7073170731707317, |
|
"eval_QUANTITY_recall": 0.8787878787878788, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18127557635307312, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.827127659574468, |
|
"eval_overall_precision": 0.7679012345679013, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3512, |
|
"eval_samples_per_second": 532.43, |
|
"eval_steps_per_second": 8.542, |
|
"step": 7950 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 0.07505329698324203, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0308, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.8344370860927152, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7875, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7169811320754718, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6063829787234043, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8888888888888887, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8717948717948718, |
|
"eval_PERSON_recall": 0.9066666666666666, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.17781808972358704, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8277703604806409, |
|
"eval_overall_precision": 0.7711442786069652, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3505, |
|
"eval_samples_per_second": 533.468, |
|
"eval_steps_per_second": 8.558, |
|
"step": 8056 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 1.183031439781189, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.0305, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.8129032258064516, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.75, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7199999999999999, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6352941176470588, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7567567567567567, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6829268292682927, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.18227067589759827, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.8262032085561497, |
|
"eval_overall_precision": 0.770573566084788, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3499, |
|
"eval_samples_per_second": 534.482, |
|
"eval_steps_per_second": 8.575, |
|
"step": 8162 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 0.4748055636882782, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.0298, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.8387096774193548, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7738095238095238, |
|
"eval_LOCATION_recall": 0.9154929577464789, |
|
"eval_ORGANIZATION_f1": 0.7236842105263158, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.632183908045977, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8932038834951457, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8679245283018868, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.912280701754386, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.896551724137931, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1802036613225937, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.8315508021390374, |
|
"eval_overall_precision": 0.7755610972568578, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3497, |
|
"eval_samples_per_second": 534.703, |
|
"eval_steps_per_second": 8.578, |
|
"step": 8268 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 1.2819609642028809, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0302, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.8205128205128205, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7529411764705882, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.728476821192053, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6395348837209303, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.90032154340836, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8695652173913043, |
|
"eval_PERSON_recall": 0.9333333333333333, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.18992583453655243, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.8286852589641435, |
|
"eval_overall_precision": 0.7684729064039408, |
|
"eval_overall_recall": 0.899135446685879, |
|
"eval_runtime": 0.3507, |
|
"eval_samples_per_second": 533.193, |
|
"eval_steps_per_second": 8.554, |
|
"step": 8374 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 0.5597596168518066, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0307, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.8533333333333334, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.810126582278481, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7066666666666667, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6235294117647059, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8932038834951457, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8679245283018868, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.6842105263157895, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6046511627906976, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8524590163934426, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.7878787878787878, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.18140378594398499, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8230563002680964, |
|
"eval_overall_precision": 0.7694235588972431, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3504, |
|
"eval_samples_per_second": 533.729, |
|
"eval_steps_per_second": 8.562, |
|
"step": 8480 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 0.40338334441185, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0275, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.8366013071895425, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7058823529411765, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6136363636363636, |
|
"eval_ORGANIZATION_recall": 0.8307692307692308, |
|
"eval_PERSON_f1": 0.896103896103896, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8734177215189873, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.18396371603012085, |
|
"eval_overall_accuracy": 0.9585354025218235, |
|
"eval_overall_f1": 0.8262032085561497, |
|
"eval_overall_precision": 0.770573566084788, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3499, |
|
"eval_samples_per_second": 534.509, |
|
"eval_steps_per_second": 8.575, |
|
"step": 8586 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 0.6464970111846924, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0285, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.8496732026143791, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7926829268292683, |
|
"eval_LOCATION_recall": 0.9154929577464789, |
|
"eval_ORGANIZATION_f1": 0.7142857142857143, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6179775280898876, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18916206061840057, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8255659121171772, |
|
"eval_overall_precision": 0.7673267326732673, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3508, |
|
"eval_samples_per_second": 533.079, |
|
"eval_steps_per_second": 8.552, |
|
"step": 8692 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 0.22236359119415283, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.0303, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.8366013071895425, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7804878048780488, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7051282051282052, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6043956043956044, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18220850825309753, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.8207171314741034, |
|
"eval_overall_precision": 0.7610837438423645, |
|
"eval_overall_recall": 0.8904899135446686, |
|
"eval_runtime": 0.3506, |
|
"eval_samples_per_second": 533.426, |
|
"eval_steps_per_second": 8.558, |
|
"step": 8798 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 0.35181981325149536, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0291, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.8076923076923077, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7411764705882353, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.6973684210526315, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6091954022988506, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.1842212826013565, |
|
"eval_overall_accuracy": 0.95635305528613, |
|
"eval_overall_f1": 0.8164893617021276, |
|
"eval_overall_precision": 0.7580246913580246, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3505, |
|
"eval_samples_per_second": 533.572, |
|
"eval_steps_per_second": 8.56, |
|
"step": 8904 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 0.7243216037750244, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0275, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.8311688311688312, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.6883116883116883, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.5955056179775281, |
|
"eval_ORGANIZATION_recall": 0.8153846153846154, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8813559322033899, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8387096774193549, |
|
"eval_TIME_recall": 0.9285714285714286, |
|
"eval_loss": 0.18761229515075684, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.8191489361702129, |
|
"eval_overall_precision": 0.7604938271604939, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3509, |
|
"eval_samples_per_second": 532.932, |
|
"eval_steps_per_second": 8.55, |
|
"step": 9010 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 0.5909172296524048, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0286, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.8311688311688312, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7710843373493976, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7388535031847134, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6304347826086957, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8954248366013071, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8782051282051282, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1853346824645996, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8282290279627165, |
|
"eval_overall_precision": 0.7698019801980198, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3502, |
|
"eval_samples_per_second": 533.924, |
|
"eval_steps_per_second": 8.566, |
|
"step": 9116 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 0.7483916878700256, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0283, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.8289473684210527, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7777777777777778, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7295597484276729, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6170212765957447, |
|
"eval_ORGANIZATION_recall": 0.8923076923076924, |
|
"eval_PERSON_f1": 0.8867313915857605, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8616352201257862, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1859874278306961, |
|
"eval_overall_accuracy": 0.9580504364694471, |
|
"eval_overall_f1": 0.8244680851063829, |
|
"eval_overall_precision": 0.7654320987654321, |
|
"eval_overall_recall": 0.8933717579250721, |
|
"eval_runtime": 0.3491, |
|
"eval_samples_per_second": 535.601, |
|
"eval_steps_per_second": 8.593, |
|
"step": 9222 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 0.6192948222160339, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0278, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.8289473684210527, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7777777777777778, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.7354838709677419, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6333333333333333, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.8903225806451613, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8625, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7777777777777778, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.717948717948718, |
|
"eval_QUANTITY_recall": 0.8484848484848485, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.1810171753168106, |
|
"eval_overall_accuracy": 0.9592628516003879, |
|
"eval_overall_f1": 0.8315508021390374, |
|
"eval_overall_precision": 0.7755610972568578, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3504, |
|
"eval_samples_per_second": 533.64, |
|
"eval_steps_per_second": 8.561, |
|
"step": 9328 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 0.5605934858322144, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0277, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.8421052631578947, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7901234567901234, |
|
"eval_LOCATION_recall": 0.9014084507042254, |
|
"eval_ORGANIZATION_f1": 0.7124999999999999, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6, |
|
"eval_ORGANIZATION_recall": 0.8769230769230769, |
|
"eval_PERSON_f1": 0.887459807073955, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8571428571428571, |
|
"eval_PERSON_recall": 0.92, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18933603167533875, |
|
"eval_overall_accuracy": 0.95635305528613, |
|
"eval_overall_f1": 0.820580474934037, |
|
"eval_overall_precision": 0.7566909975669099, |
|
"eval_overall_recall": 0.8962536023054755, |
|
"eval_runtime": 0.3526, |
|
"eval_samples_per_second": 530.391, |
|
"eval_steps_per_second": 8.509, |
|
"step": 9434 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 0.2893717586994171, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0274, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.8157894736842104, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7142857142857143, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6179775280898876, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8925081433224756, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8726114649681529, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7123287671232875, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.65, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18061868846416473, |
|
"eval_overall_accuracy": 0.9582929194956353, |
|
"eval_overall_f1": 0.8176943699731903, |
|
"eval_overall_precision": 0.7644110275689223, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3513, |
|
"eval_samples_per_second": 532.297, |
|
"eval_steps_per_second": 8.54, |
|
"step": 9540 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 0.9740373492240906, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0262, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.708860759493671, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6021505376344086, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7105263157894738, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.627906976744186, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18925167620182037, |
|
"eval_overall_accuracy": 0.95635305528613, |
|
"eval_overall_f1": 0.8100263852242744, |
|
"eval_overall_precision": 0.7469586374695864, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3493, |
|
"eval_samples_per_second": 535.417, |
|
"eval_steps_per_second": 8.59, |
|
"step": 9646 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 0.1865842491388321, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.0263, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.8157894736842104, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7466666666666668, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6588235294117647, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7123287671232875, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.65, |
|
"eval_QUANTITY_recall": 0.7878787878787878, |
|
"eval_TIME_f1": 0.8333333333333334, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.78125, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18539157509803772, |
|
"eval_overall_accuracy": 0.9587778855480117, |
|
"eval_overall_f1": 0.8203753351206434, |
|
"eval_overall_precision": 0.7669172932330827, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3492, |
|
"eval_samples_per_second": 535.496, |
|
"eval_steps_per_second": 8.591, |
|
"step": 9752 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 0.1964859962463379, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.0253, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.823529411764706, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7682926829268293, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.713375796178344, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6086956521739131, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7297297297297297, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.189639613032341, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8158940397350992, |
|
"eval_overall_precision": 0.7549019607843137, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.351, |
|
"eval_samples_per_second": 532.764, |
|
"eval_steps_per_second": 8.547, |
|
"step": 9858 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 0.6065542101860046, |
|
"learning_rate": 3e-06, |
|
"loss": 0.0246, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.8157894736842104, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.713375796178344, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6086956521739131, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8766233766233766, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8544303797468354, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18659386038780212, |
|
"eval_overall_accuracy": 0.957807953443259, |
|
"eval_overall_f1": 0.8144192256341789, |
|
"eval_overall_precision": 0.7587064676616916, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3514, |
|
"eval_samples_per_second": 532.142, |
|
"eval_steps_per_second": 8.537, |
|
"step": 9964 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 0.47104644775390625, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0277, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.8104575163398693, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7560975609756098, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7368421052631579, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6436781609195402, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8737864077669903, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8490566037735849, |
|
"eval_PERSON_recall": 0.9, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18918968737125397, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.8155080213903744, |
|
"eval_overall_precision": 0.7605985037406484, |
|
"eval_overall_recall": 0.8789625360230547, |
|
"eval_runtime": 0.3518, |
|
"eval_samples_per_second": 531.589, |
|
"eval_steps_per_second": 8.528, |
|
"step": 10070 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 0.6074219346046448, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0261, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.8157894736842104, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.717948717948718, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6153846153846154, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7397260273972603, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.675, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18794935941696167, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.8175765645805593, |
|
"eval_overall_precision": 0.7599009900990099, |
|
"eval_overall_recall": 0.8847262247838616, |
|
"eval_runtime": 0.3495, |
|
"eval_samples_per_second": 534.995, |
|
"eval_steps_per_second": 8.583, |
|
"step": 10176 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 0.5106649398803711, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.025, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.8157894736842104, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7654320987654321, |
|
"eval_LOCATION_recall": 0.8732394366197183, |
|
"eval_ORGANIZATION_f1": 0.7189542483660131, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.625, |
|
"eval_ORGANIZATION_recall": 0.8461538461538461, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18944178521633148, |
|
"eval_overall_accuracy": 0.9575654704170709, |
|
"eval_overall_f1": 0.816, |
|
"eval_overall_precision": 0.7593052109181141, |
|
"eval_overall_recall": 0.8818443804034583, |
|
"eval_runtime": 0.3495, |
|
"eval_samples_per_second": 535.094, |
|
"eval_steps_per_second": 8.584, |
|
"step": 10282 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 0.6887297034263611, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0257, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.823529411764706, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7682926829268293, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.713375796178344, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6086956521739131, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19144974648952484, |
|
"eval_overall_accuracy": 0.9570805043646945, |
|
"eval_overall_f1": 0.8148148148148148, |
|
"eval_overall_precision": 0.7530562347188264, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3502, |
|
"eval_samples_per_second": 533.939, |
|
"eval_steps_per_second": 8.566, |
|
"step": 10388 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 0.14230668544769287, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.0274, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.823529411764706, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7682926829268293, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.713375796178344, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6086956521739131, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8810289389067525, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.8509316770186336, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7200000000000001, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6428571428571429, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.19010868668556213, |
|
"eval_overall_accuracy": 0.9568380213385063, |
|
"eval_overall_f1": 0.8158940397350992, |
|
"eval_overall_precision": 0.7549019607843137, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3511, |
|
"eval_samples_per_second": 532.588, |
|
"eval_steps_per_second": 8.544, |
|
"step": 10494 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 0.5434573292732239, |
|
"learning_rate": 0.0, |
|
"loss": 0.0256, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.823529411764706, |
|
"eval_LOCATION_number": 71, |
|
"eval_LOCATION_precision": 0.7682926829268293, |
|
"eval_LOCATION_recall": 0.8873239436619719, |
|
"eval_ORGANIZATION_f1": 0.717948717948718, |
|
"eval_ORGANIZATION_number": 65, |
|
"eval_ORGANIZATION_precision": 0.6153846153846154, |
|
"eval_ORGANIZATION_recall": 0.8615384615384616, |
|
"eval_PERSON_f1": 0.8782051282051282, |
|
"eval_PERSON_number": 150, |
|
"eval_PERSON_precision": 0.845679012345679, |
|
"eval_PERSON_recall": 0.9133333333333333, |
|
"eval_QUANTITY_f1": 0.7297297297297297, |
|
"eval_QUANTITY_number": 33, |
|
"eval_QUANTITY_precision": 0.6585365853658537, |
|
"eval_QUANTITY_recall": 0.8181818181818182, |
|
"eval_TIME_f1": 0.8474576271186439, |
|
"eval_TIME_number": 28, |
|
"eval_TIME_precision": 0.8064516129032258, |
|
"eval_TIME_recall": 0.8928571428571429, |
|
"eval_loss": 0.18971124291419983, |
|
"eval_overall_accuracy": 0.9573229873908826, |
|
"eval_overall_f1": 0.816976127320955, |
|
"eval_overall_precision": 0.7567567567567568, |
|
"eval_overall_recall": 0.8876080691642652, |
|
"eval_runtime": 0.3511, |
|
"eval_samples_per_second": 532.586, |
|
"eval_steps_per_second": 8.544, |
|
"step": 10600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 10600, |
|
"total_flos": 5123217774191952.0, |
|
"train_loss": 0.07423505819068765, |
|
"train_runtime": 606.268, |
|
"train_samples_per_second": 278.425, |
|
"train_steps_per_second": 17.484 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 10600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 5123217774191952.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|