|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 100.0, |
|
"eval_steps": 500, |
|
"global_step": 9600, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 1.569076418876648, |
|
"learning_rate": 4.9500000000000004e-05, |
|
"loss": 1.1639, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.0, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.0, |
|
"eval_PERSON_recall": 0.0, |
|
"eval_loss": 0.6982586979866028, |
|
"eval_overall_accuracy": 0.8373377520022093, |
|
"eval_overall_f1": 0.0, |
|
"eval_overall_precision": 0.0, |
|
"eval_overall_recall": 0.0, |
|
"eval_runtime": 0.5919, |
|
"eval_samples_per_second": 287.192, |
|
"eval_steps_per_second": 5.068, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 0.9749519228935242, |
|
"learning_rate": 4.9e-05, |
|
"loss": 0.6685, |
|
"step": 192 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.0, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.0, |
|
"eval_ORGANIZATION_recall": 0.0, |
|
"eval_PERSON_f1": 0.0, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.0, |
|
"eval_PERSON_recall": 0.0, |
|
"eval_loss": 0.565019428730011, |
|
"eval_overall_accuracy": 0.8376139188069595, |
|
"eval_overall_f1": 0.0, |
|
"eval_overall_precision": 0.0, |
|
"eval_overall_recall": 0.0, |
|
"eval_runtime": 0.6878, |
|
"eval_samples_per_second": 247.148, |
|
"eval_steps_per_second": 4.361, |
|
"step": 192 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 1.0692148208618164, |
|
"learning_rate": 4.85e-05, |
|
"loss": 0.553, |
|
"step": 288 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_LOCATION_f1": 0.0, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.0, |
|
"eval_LOCATION_recall": 0.0, |
|
"eval_ORGANIZATION_f1": 0.07407407407407407, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.3888888888888889, |
|
"eval_ORGANIZATION_recall": 0.04093567251461988, |
|
"eval_PERSON_f1": 0.10526315789473685, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.225, |
|
"eval_PERSON_recall": 0.06870229007633588, |
|
"eval_loss": 0.4425106644630432, |
|
"eval_overall_accuracy": 0.8470035901684617, |
|
"eval_overall_f1": 0.06866952789699571, |
|
"eval_overall_precision": 0.26229508196721313, |
|
"eval_overall_recall": 0.03950617283950617, |
|
"eval_runtime": 0.6213, |
|
"eval_samples_per_second": 273.628, |
|
"eval_steps_per_second": 4.829, |
|
"step": 288 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 0.8610777258872986, |
|
"learning_rate": 4.8e-05, |
|
"loss": 0.4403, |
|
"step": 384 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_LOCATION_f1": 0.078125, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.2, |
|
"eval_LOCATION_recall": 0.04854368932038835, |
|
"eval_ORGANIZATION_f1": 0.29078014184397166, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.36936936936936937, |
|
"eval_ORGANIZATION_recall": 0.23976608187134502, |
|
"eval_PERSON_f1": 0.4290657439446367, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.3924050632911392, |
|
"eval_PERSON_recall": 0.4732824427480916, |
|
"eval_loss": 0.33291852474212646, |
|
"eval_overall_accuracy": 0.8834576083954708, |
|
"eval_overall_f1": 0.3090128755364807, |
|
"eval_overall_precision": 0.3673469387755102, |
|
"eval_overall_recall": 0.26666666666666666, |
|
"eval_runtime": 0.6305, |
|
"eval_samples_per_second": 269.628, |
|
"eval_steps_per_second": 4.758, |
|
"step": 384 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 0.5931413769721985, |
|
"learning_rate": 4.75e-05, |
|
"loss": 0.3288, |
|
"step": 480 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_LOCATION_f1": 0.3715846994535519, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.425, |
|
"eval_LOCATION_recall": 0.3300970873786408, |
|
"eval_ORGANIZATION_f1": 0.5683646112600537, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.5247524752475248, |
|
"eval_ORGANIZATION_recall": 0.6198830409356725, |
|
"eval_PERSON_f1": 0.6107382550335572, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.5449101796407185, |
|
"eval_PERSON_recall": 0.6946564885496184, |
|
"eval_loss": 0.24550960958003998, |
|
"eval_overall_accuracy": 0.9262634631317316, |
|
"eval_overall_f1": 0.540983606557377, |
|
"eval_overall_precision": 0.5144766146993318, |
|
"eval_overall_recall": 0.5703703703703704, |
|
"eval_runtime": 0.6072, |
|
"eval_samples_per_second": 279.961, |
|
"eval_steps_per_second": 4.94, |
|
"step": 480 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 1.293260097503662, |
|
"learning_rate": 4.7e-05, |
|
"loss": 0.2474, |
|
"step": 576 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_LOCATION_f1": 0.626865671641791, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.6428571428571429, |
|
"eval_LOCATION_recall": 0.6116504854368932, |
|
"eval_ORGANIZATION_f1": 0.6863270777479892, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.6336633663366337, |
|
"eval_ORGANIZATION_recall": 0.7485380116959064, |
|
"eval_PERSON_f1": 0.833922261484099, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.7763157894736842, |
|
"eval_PERSON_recall": 0.9007633587786259, |
|
"eval_loss": 0.18931446969509125, |
|
"eval_overall_accuracy": 0.9505661419497377, |
|
"eval_overall_f1": 0.721120186697783, |
|
"eval_overall_precision": 0.6836283185840708, |
|
"eval_overall_recall": 0.762962962962963, |
|
"eval_runtime": 0.5962, |
|
"eval_samples_per_second": 285.148, |
|
"eval_steps_per_second": 5.032, |
|
"step": 576 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 1.2653672695159912, |
|
"learning_rate": 4.6500000000000005e-05, |
|
"loss": 0.1962, |
|
"step": 672 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_LOCATION_f1": 0.7551020408163266, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.7956989247311828, |
|
"eval_LOCATION_recall": 0.7184466019417476, |
|
"eval_ORGANIZATION_f1": 0.7526881720430108, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.6965174129353234, |
|
"eval_ORGANIZATION_recall": 0.8187134502923976, |
|
"eval_PERSON_f1": 0.9157509157509158, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.8802816901408451, |
|
"eval_PERSON_recall": 0.9541984732824428, |
|
"eval_loss": 0.1533629298210144, |
|
"eval_overall_accuracy": 0.9605081469207402, |
|
"eval_overall_f1": 0.8061831153388822, |
|
"eval_overall_precision": 0.7775229357798165, |
|
"eval_overall_recall": 0.837037037037037, |
|
"eval_runtime": 0.5884, |
|
"eval_samples_per_second": 288.903, |
|
"eval_steps_per_second": 5.098, |
|
"step": 672 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 0.9401953816413879, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.1659, |
|
"step": 768 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_LOCATION_f1": 0.7980295566502462, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.81, |
|
"eval_LOCATION_recall": 0.7864077669902912, |
|
"eval_ORGANIZATION_f1": 0.7899159663865545, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.7580645161290323, |
|
"eval_ORGANIZATION_recall": 0.8245614035087719, |
|
"eval_PERSON_f1": 0.9328358208955224, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9124087591240876, |
|
"eval_PERSON_recall": 0.9541984732824428, |
|
"eval_loss": 0.12766310572624207, |
|
"eval_overall_accuracy": 0.9652029826014913, |
|
"eval_overall_f1": 0.8381642512077295, |
|
"eval_overall_precision": 0.8203309692671394, |
|
"eval_overall_recall": 0.8567901234567902, |
|
"eval_runtime": 0.5896, |
|
"eval_samples_per_second": 288.354, |
|
"eval_steps_per_second": 5.089, |
|
"step": 768 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 1.0895642042160034, |
|
"learning_rate": 4.55e-05, |
|
"loss": 0.1495, |
|
"step": 864 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_LOCATION_f1": 0.835820895522388, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8571428571428571, |
|
"eval_LOCATION_recall": 0.8155339805825242, |
|
"eval_ORGANIZATION_f1": 0.8099173553719009, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.765625, |
|
"eval_ORGANIZATION_recall": 0.8596491228070176, |
|
"eval_PERSON_f1": 0.9338235294117646, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.900709219858156, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.11188717931509018, |
|
"eval_overall_accuracy": 0.9690693178679922, |
|
"eval_overall_f1": 0.8564593301435406, |
|
"eval_overall_precision": 0.8306264501160093, |
|
"eval_overall_recall": 0.8839506172839506, |
|
"eval_runtime": 0.6012, |
|
"eval_samples_per_second": 282.766, |
|
"eval_steps_per_second": 4.99, |
|
"step": 864 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"grad_norm": 1.217275857925415, |
|
"learning_rate": 4.5e-05, |
|
"loss": 0.1342, |
|
"step": 960 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_LOCATION_f1": 0.8374384236453202, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.85, |
|
"eval_LOCATION_recall": 0.8252427184466019, |
|
"eval_ORGANIZATION_f1": 0.8277777777777778, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.7883597883597884, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.929889298892989, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.10086647421121597, |
|
"eval_overall_accuracy": 0.9707263186964927, |
|
"eval_overall_f1": 0.8633093525179856, |
|
"eval_overall_precision": 0.8391608391608392, |
|
"eval_overall_recall": 0.8888888888888888, |
|
"eval_runtime": 0.6119, |
|
"eval_samples_per_second": 277.843, |
|
"eval_steps_per_second": 4.903, |
|
"step": 960 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"grad_norm": 2.0349202156066895, |
|
"learning_rate": 4.4500000000000004e-05, |
|
"loss": 0.1241, |
|
"step": 1056 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_LOCATION_f1": 0.8365384615384616, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8285714285714286, |
|
"eval_LOCATION_recall": 0.8446601941747572, |
|
"eval_ORGANIZATION_f1": 0.8342857142857143, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8156424581005587, |
|
"eval_ORGANIZATION_recall": 0.8538011695906432, |
|
"eval_PERSON_f1": 0.9438202247191011, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9264705882352942, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.09149681031703949, |
|
"eval_overall_accuracy": 0.9726594863297432, |
|
"eval_overall_f1": 0.8703030303030304, |
|
"eval_overall_precision": 0.8547619047619047, |
|
"eval_overall_recall": 0.8864197530864197, |
|
"eval_runtime": 0.5981, |
|
"eval_samples_per_second": 284.231, |
|
"eval_steps_per_second": 5.016, |
|
"step": 1056 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"grad_norm": 3.014051914215088, |
|
"learning_rate": 4.4000000000000006e-05, |
|
"loss": 0.1188, |
|
"step": 1152 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_LOCATION_f1": 0.8309178743961353, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8269230769230769, |
|
"eval_LOCATION_recall": 0.8349514563106796, |
|
"eval_ORGANIZATION_f1": 0.8579545454545455, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8342541436464088, |
|
"eval_ORGANIZATION_recall": 0.8830409356725146, |
|
"eval_PERSON_f1": 0.9402985074626866, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9197080291970803, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.08539355546236038, |
|
"eval_overall_accuracy": 0.9745926539629937, |
|
"eval_overall_f1": 0.8778718258766627, |
|
"eval_overall_precision": 0.8601895734597157, |
|
"eval_overall_recall": 0.8962962962962963, |
|
"eval_runtime": 0.5994, |
|
"eval_samples_per_second": 283.636, |
|
"eval_steps_per_second": 5.005, |
|
"step": 1152 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"grad_norm": 2.8539180755615234, |
|
"learning_rate": 4.35e-05, |
|
"loss": 0.1102, |
|
"step": 1248 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_LOCATION_f1": 0.8695652173913043, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8653846153846154, |
|
"eval_LOCATION_recall": 0.8737864077669902, |
|
"eval_ORGANIZATION_f1": 0.866096866096866, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8444444444444444, |
|
"eval_ORGANIZATION_recall": 0.8888888888888888, |
|
"eval_PERSON_f1": 0.9473684210526315, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9333333333333333, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.07981602847576141, |
|
"eval_overall_accuracy": 0.9762496547914941, |
|
"eval_overall_f1": 0.8932038834951457, |
|
"eval_overall_precision": 0.8782816229116945, |
|
"eval_overall_recall": 0.908641975308642, |
|
"eval_runtime": 0.598, |
|
"eval_samples_per_second": 284.265, |
|
"eval_steps_per_second": 5.016, |
|
"step": 1248 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"grad_norm": 0.624473512172699, |
|
"learning_rate": 4.3e-05, |
|
"loss": 0.1044, |
|
"step": 1344 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_LOCATION_f1": 0.8768472906403941, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.89, |
|
"eval_LOCATION_recall": 0.8640776699029126, |
|
"eval_ORGANIZATION_f1": 0.8830409356725146, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8830409356725146, |
|
"eval_ORGANIZATION_recall": 0.8830409356725146, |
|
"eval_PERSON_f1": 0.9509433962264152, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9402985074626866, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.07802519202232361, |
|
"eval_overall_accuracy": 0.9781828224247445, |
|
"eval_overall_f1": 0.9037037037037037, |
|
"eval_overall_precision": 0.9037037037037037, |
|
"eval_overall_recall": 0.9037037037037037, |
|
"eval_runtime": 0.5951, |
|
"eval_samples_per_second": 285.656, |
|
"eval_steps_per_second": 5.041, |
|
"step": 1344 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"grad_norm": 0.996662437915802, |
|
"learning_rate": 4.25e-05, |
|
"loss": 0.1009, |
|
"step": 1440 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_LOCATION_f1": 0.891089108910891, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.9090909090909091, |
|
"eval_LOCATION_recall": 0.8737864077669902, |
|
"eval_ORGANIZATION_f1": 0.8788732394366197, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8478260869565217, |
|
"eval_ORGANIZATION_recall": 0.9122807017543859, |
|
"eval_PERSON_f1": 0.9584905660377357, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9477611940298507, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.07211567461490631, |
|
"eval_overall_accuracy": 0.9781828224247445, |
|
"eval_overall_f1": 0.9075425790754258, |
|
"eval_overall_precision": 0.894484412470024, |
|
"eval_overall_recall": 0.9209876543209876, |
|
"eval_runtime": 0.5925, |
|
"eval_samples_per_second": 286.903, |
|
"eval_steps_per_second": 5.063, |
|
"step": 1440 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"grad_norm": 1.0493874549865723, |
|
"learning_rate": 4.2e-05, |
|
"loss": 0.0978, |
|
"step": 1536 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_LOCATION_f1": 0.8932038834951457, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8932038834951457, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8725212464589235, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8461538461538461, |
|
"eval_ORGANIZATION_recall": 0.9005847953216374, |
|
"eval_PERSON_f1": 0.9509433962264152, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9402985074626866, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.06955698877573013, |
|
"eval_overall_accuracy": 0.9779066556199945, |
|
"eval_overall_f1": 0.9029126213592233, |
|
"eval_overall_precision": 0.8878281622911695, |
|
"eval_overall_recall": 0.9185185185185185, |
|
"eval_runtime": 0.6569, |
|
"eval_samples_per_second": 258.806, |
|
"eval_steps_per_second": 4.567, |
|
"step": 1536 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"grad_norm": 0.8617897629737854, |
|
"learning_rate": 4.15e-05, |
|
"loss": 0.0962, |
|
"step": 1632 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_LOCATION_f1": 0.9064039408866995, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.92, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8869565217391304, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8793103448275862, |
|
"eval_ORGANIZATION_recall": 0.8947368421052632, |
|
"eval_PERSON_f1": 0.962121212121212, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9548872180451128, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.06796535849571228, |
|
"eval_overall_accuracy": 0.980115990057995, |
|
"eval_overall_f1": 0.916256157635468, |
|
"eval_overall_precision": 0.914004914004914, |
|
"eval_overall_recall": 0.9185185185185185, |
|
"eval_runtime": 0.6013, |
|
"eval_samples_per_second": 282.726, |
|
"eval_steps_per_second": 4.989, |
|
"step": 1632 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"grad_norm": 0.8590739965438843, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.0909, |
|
"step": 1728 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_LOCATION_f1": 0.896551724137931, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.91, |
|
"eval_LOCATION_recall": 0.883495145631068, |
|
"eval_ORGANIZATION_f1": 0.8831908831908832, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8611111111111112, |
|
"eval_ORGANIZATION_recall": 0.9064327485380117, |
|
"eval_PERSON_f1": 0.9509433962264152, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9402985074626866, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.0644010454416275, |
|
"eval_overall_accuracy": 0.9798398232532449, |
|
"eval_overall_f1": 0.9084249084249084, |
|
"eval_overall_precision": 0.8985507246376812, |
|
"eval_overall_recall": 0.9185185185185185, |
|
"eval_runtime": 0.5942, |
|
"eval_samples_per_second": 286.117, |
|
"eval_steps_per_second": 5.049, |
|
"step": 1728 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"grad_norm": 2.493396520614624, |
|
"learning_rate": 4.05e-05, |
|
"loss": 0.088, |
|
"step": 1824 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_LOCATION_f1": 0.9009900990099011, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.9191919191919192, |
|
"eval_LOCATION_recall": 0.883495145631068, |
|
"eval_ORGANIZATION_f1": 0.8908045977011494, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8757062146892656, |
|
"eval_ORGANIZATION_recall": 0.9064327485380117, |
|
"eval_PERSON_f1": 0.9545454545454546, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9473684210526315, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.0634172335267067, |
|
"eval_overall_accuracy": 0.9806683236674951, |
|
"eval_overall_f1": 0.914004914004914, |
|
"eval_overall_precision": 0.9095354523227384, |
|
"eval_overall_recall": 0.9185185185185185, |
|
"eval_runtime": 0.5943, |
|
"eval_samples_per_second": 286.044, |
|
"eval_steps_per_second": 5.048, |
|
"step": 1824 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"grad_norm": 0.5532075762748718, |
|
"learning_rate": 4e-05, |
|
"loss": 0.0836, |
|
"step": 1920 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_LOCATION_f1": 0.8888888888888888, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8846153846153846, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8863636363636364, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.861878453038674, |
|
"eval_ORGANIZATION_recall": 0.9122807017543859, |
|
"eval_PERSON_f1": 0.9509433962264152, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9402985074626866, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.06357116252183914, |
|
"eval_overall_accuracy": 0.9798398232532449, |
|
"eval_overall_f1": 0.9077669902912622, |
|
"eval_overall_precision": 0.8926014319809069, |
|
"eval_overall_recall": 0.9234567901234568, |
|
"eval_runtime": 0.5958, |
|
"eval_samples_per_second": 285.346, |
|
"eval_steps_per_second": 5.036, |
|
"step": 1920 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"grad_norm": 1.6820136308670044, |
|
"learning_rate": 3.9500000000000005e-05, |
|
"loss": 0.0836, |
|
"step": 2016 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_LOCATION_f1": 0.8888888888888888, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8846153846153846, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8760806916426512, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8636363636363636, |
|
"eval_ORGANIZATION_recall": 0.8888888888888888, |
|
"eval_PERSON_f1": 0.9545454545454546, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9473684210526315, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.05993271991610527, |
|
"eval_overall_accuracy": 0.9806683236674951, |
|
"eval_overall_f1": 0.9046454767726161, |
|
"eval_overall_precision": 0.8958837772397095, |
|
"eval_overall_recall": 0.9135802469135802, |
|
"eval_runtime": 0.5978, |
|
"eval_samples_per_second": 284.362, |
|
"eval_steps_per_second": 5.018, |
|
"step": 2016 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"grad_norm": 0.9439449906349182, |
|
"learning_rate": 3.9000000000000006e-05, |
|
"loss": 0.0827, |
|
"step": 2112 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_LOCATION_f1": 0.8761904761904761, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8598130841121495, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8757062146892655, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8469945355191257, |
|
"eval_ORGANIZATION_recall": 0.9064327485380117, |
|
"eval_PERSON_f1": 0.9509433962264152, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9402985074626866, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.05957403779029846, |
|
"eval_overall_accuracy": 0.9798398232532449, |
|
"eval_overall_f1": 0.8998793727382389, |
|
"eval_overall_precision": 0.8797169811320755, |
|
"eval_overall_recall": 0.9209876543209876, |
|
"eval_runtime": 0.5967, |
|
"eval_samples_per_second": 284.901, |
|
"eval_steps_per_second": 5.028, |
|
"step": 2112 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"grad_norm": 1.140651822090149, |
|
"learning_rate": 3.85e-05, |
|
"loss": 0.077, |
|
"step": 2208 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_LOCATION_f1": 0.8750000000000001, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8666666666666667, |
|
"eval_LOCATION_recall": 0.883495145631068, |
|
"eval_ORGANIZATION_f1": 0.8818443804034583, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8693181818181818, |
|
"eval_ORGANIZATION_recall": 0.8947368421052632, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.058286890387535095, |
|
"eval_overall_accuracy": 0.9806683236674951, |
|
"eval_overall_f1": 0.9070904645476773, |
|
"eval_overall_precision": 0.8983050847457628, |
|
"eval_overall_recall": 0.9160493827160494, |
|
"eval_runtime": 0.6001, |
|
"eval_samples_per_second": 283.301, |
|
"eval_steps_per_second": 4.999, |
|
"step": 2208 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"grad_norm": 0.9434022307395935, |
|
"learning_rate": 3.8e-05, |
|
"loss": 0.0774, |
|
"step": 2304 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_LOCATION_f1": 0.861111111111111, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8230088495575221, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8529411764705882, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8579881656804734, |
|
"eval_ORGANIZATION_recall": 0.847953216374269, |
|
"eval_PERSON_f1": 0.9545454545454546, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9473684210526315, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.05800532177090645, |
|
"eval_overall_accuracy": 0.9787351560342447, |
|
"eval_overall_f1": 0.8878048780487805, |
|
"eval_overall_precision": 0.8771084337349397, |
|
"eval_overall_recall": 0.8987654320987655, |
|
"eval_runtime": 0.6032, |
|
"eval_samples_per_second": 281.813, |
|
"eval_steps_per_second": 4.973, |
|
"step": 2304 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"grad_norm": 1.0291742086410522, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.0782, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_LOCATION_f1": 0.8792270531400966, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.875, |
|
"eval_LOCATION_recall": 0.883495145631068, |
|
"eval_ORGANIZATION_f1": 0.8816568047337278, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8922155688622755, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9545454545454546, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9473684210526315, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.05705862119793892, |
|
"eval_overall_accuracy": 0.9798398232532449, |
|
"eval_overall_f1": 0.9048207663782447, |
|
"eval_overall_precision": 0.905940594059406, |
|
"eval_overall_recall": 0.9037037037037037, |
|
"eval_runtime": 0.6018, |
|
"eval_samples_per_second": 282.474, |
|
"eval_steps_per_second": 4.985, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"grad_norm": 0.6928281784057617, |
|
"learning_rate": 3.7e-05, |
|
"loss": 0.0771, |
|
"step": 2496 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_LOCATION_f1": 0.8975609756097561, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.9019607843137255, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8977272727272728, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8729281767955801, |
|
"eval_ORGANIZATION_recall": 0.9239766081871345, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.055970560759305954, |
|
"eval_overall_accuracy": 0.9820491576912456, |
|
"eval_overall_f1": 0.9195121951219513, |
|
"eval_overall_precision": 0.908433734939759, |
|
"eval_overall_recall": 0.9308641975308642, |
|
"eval_runtime": 0.6049, |
|
"eval_samples_per_second": 281.02, |
|
"eval_steps_per_second": 4.959, |
|
"step": 2496 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"grad_norm": 1.4192240238189697, |
|
"learning_rate": 3.65e-05, |
|
"loss": 0.0726, |
|
"step": 2592 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_LOCATION_f1": 0.9064039408866995, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.92, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.9008498583569404, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8736263736263736, |
|
"eval_ORGANIZATION_recall": 0.9298245614035088, |
|
"eval_PERSON_f1": 0.9545454545454546, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9473684210526315, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.05344228819012642, |
|
"eval_overall_accuracy": 0.9826014913007457, |
|
"eval_overall_f1": 0.9195121951219513, |
|
"eval_overall_precision": 0.908433734939759, |
|
"eval_overall_recall": 0.9308641975308642, |
|
"eval_runtime": 0.605, |
|
"eval_samples_per_second": 281.0, |
|
"eval_steps_per_second": 4.959, |
|
"step": 2592 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"grad_norm": 1.0541571378707886, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.0712, |
|
"step": 2688 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_LOCATION_f1": 0.8932038834951457, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8932038834951457, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8939828080229225, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8764044943820225, |
|
"eval_ORGANIZATION_recall": 0.9122807017543859, |
|
"eval_PERSON_f1": 0.9545454545454546, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9473684210526315, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.05282684788107872, |
|
"eval_overall_accuracy": 0.9826014913007457, |
|
"eval_overall_f1": 0.9133089133089134, |
|
"eval_overall_precision": 0.9033816425120773, |
|
"eval_overall_recall": 0.9234567901234568, |
|
"eval_runtime": 0.6016, |
|
"eval_samples_per_second": 282.587, |
|
"eval_steps_per_second": 4.987, |
|
"step": 2688 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"grad_norm": 0.6951781511306763, |
|
"learning_rate": 3.55e-05, |
|
"loss": 0.0703, |
|
"step": 2784 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_LOCATION_f1": 0.9009900990099011, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.9191919191919192, |
|
"eval_LOCATION_recall": 0.883495145631068, |
|
"eval_ORGANIZATION_f1": 0.9008498583569404, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8736263736263736, |
|
"eval_ORGANIZATION_recall": 0.9298245614035088, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.05054891109466553, |
|
"eval_overall_accuracy": 0.9845346589339962, |
|
"eval_overall_f1": 0.9217603911980441, |
|
"eval_overall_precision": 0.9128329297820823, |
|
"eval_overall_recall": 0.9308641975308642, |
|
"eval_runtime": 0.5939, |
|
"eval_samples_per_second": 286.258, |
|
"eval_steps_per_second": 5.052, |
|
"step": 2784 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"grad_norm": 0.4239547550678253, |
|
"learning_rate": 3.5e-05, |
|
"loss": 0.0649, |
|
"step": 2880 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_LOCATION_f1": 0.9054726368159205, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.9285714285714286, |
|
"eval_LOCATION_recall": 0.883495145631068, |
|
"eval_ORGANIZATION_f1": 0.9065155807365438, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8791208791208791, |
|
"eval_ORGANIZATION_recall": 0.935672514619883, |
|
"eval_PERSON_f1": 0.9545454545454546, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9473684210526315, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.05008954927325249, |
|
"eval_overall_accuracy": 0.983706158519746, |
|
"eval_overall_f1": 0.9217603911980441, |
|
"eval_overall_precision": 0.9128329297820823, |
|
"eval_overall_recall": 0.9308641975308642, |
|
"eval_runtime": 0.606, |
|
"eval_samples_per_second": 280.539, |
|
"eval_steps_per_second": 4.951, |
|
"step": 2880 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"grad_norm": 1.2522234916687012, |
|
"learning_rate": 3.45e-05, |
|
"loss": 0.0642, |
|
"step": 2976 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_LOCATION_f1": 0.8720379146919431, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8518518518518519, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8786127167630058, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8685714285714285, |
|
"eval_ORGANIZATION_recall": 0.8888888888888888, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.05007793754339218, |
|
"eval_overall_accuracy": 0.9820491576912456, |
|
"eval_overall_f1": 0.9048780487804877, |
|
"eval_overall_precision": 0.8939759036144578, |
|
"eval_overall_recall": 0.9160493827160494, |
|
"eval_runtime": 0.5983, |
|
"eval_samples_per_second": 284.148, |
|
"eval_steps_per_second": 5.014, |
|
"step": 2976 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"grad_norm": 0.8345080018043518, |
|
"learning_rate": 3.4000000000000007e-05, |
|
"loss": 0.0664, |
|
"step": 3072 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_LOCATION_f1": 0.8625592417061612, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8425925925925926, |
|
"eval_LOCATION_recall": 0.883495145631068, |
|
"eval_ORGANIZATION_f1": 0.8835820895522388, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.9024390243902439, |
|
"eval_ORGANIZATION_recall": 0.8654970760233918, |
|
"eval_PERSON_f1": 0.9545454545454546, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9473684210526315, |
|
"eval_PERSON_recall": 0.9618320610687023, |
|
"eval_loss": 0.05058050900697708, |
|
"eval_overall_accuracy": 0.9817729908864954, |
|
"eval_overall_f1": 0.9012345679012346, |
|
"eval_overall_precision": 0.9012345679012346, |
|
"eval_overall_recall": 0.9012345679012346, |
|
"eval_runtime": 0.6023, |
|
"eval_samples_per_second": 282.266, |
|
"eval_steps_per_second": 4.981, |
|
"step": 3072 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"grad_norm": 0.7092554569244385, |
|
"learning_rate": 3.35e-05, |
|
"loss": 0.0659, |
|
"step": 3168 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_LOCATION_f1": 0.8584905660377358, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8348623853211009, |
|
"eval_LOCATION_recall": 0.883495145631068, |
|
"eval_ORGANIZATION_f1": 0.8842729970326408, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8975903614457831, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.0509335920214653, |
|
"eval_overall_accuracy": 0.9820491576912456, |
|
"eval_overall_f1": 0.9039408866995073, |
|
"eval_overall_precision": 0.9017199017199017, |
|
"eval_overall_recall": 0.9061728395061729, |
|
"eval_runtime": 0.5971, |
|
"eval_samples_per_second": 284.704, |
|
"eval_steps_per_second": 5.024, |
|
"step": 3168 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"grad_norm": 0.8459410071372986, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.0667, |
|
"step": 3264 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_LOCATION_f1": 0.883495145631068, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.883495145631068, |
|
"eval_LOCATION_recall": 0.883495145631068, |
|
"eval_ORGANIZATION_f1": 0.8908045977011494, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8757062146892656, |
|
"eval_ORGANIZATION_recall": 0.9064327485380117, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.050714682787656784, |
|
"eval_overall_accuracy": 0.9826014913007457, |
|
"eval_overall_f1": 0.9130966952264382, |
|
"eval_overall_precision": 0.9053398058252428, |
|
"eval_overall_recall": 0.9209876543209876, |
|
"eval_runtime": 0.5977, |
|
"eval_samples_per_second": 284.432, |
|
"eval_steps_per_second": 5.019, |
|
"step": 3264 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"grad_norm": 1.9158438444137573, |
|
"learning_rate": 3.2500000000000004e-05, |
|
"loss": 0.0639, |
|
"step": 3360 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_LOCATION_f1": 0.8761904761904761, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8598130841121495, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8934911242603552, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.9041916167664671, |
|
"eval_ORGANIZATION_recall": 0.8830409356725146, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.0509558841586113, |
|
"eval_overall_accuracy": 0.9826014913007457, |
|
"eval_overall_f1": 0.9124537607891491, |
|
"eval_overall_precision": 0.9113300492610837, |
|
"eval_overall_recall": 0.9135802469135802, |
|
"eval_runtime": 0.6048, |
|
"eval_samples_per_second": 281.07, |
|
"eval_steps_per_second": 4.96, |
|
"step": 3360 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"grad_norm": 1.0001205205917358, |
|
"learning_rate": 3.2000000000000005e-05, |
|
"loss": 0.0632, |
|
"step": 3456 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_LOCATION_f1": 0.8846153846153847, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8761904761904762, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.9032258064516129, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.9058823529411765, |
|
"eval_ORGANIZATION_recall": 0.9005847953216374, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.050493232905864716, |
|
"eval_overall_accuracy": 0.983706158519746, |
|
"eval_overall_f1": 0.91871921182266, |
|
"eval_overall_precision": 0.9164619164619164, |
|
"eval_overall_recall": 0.9209876543209876, |
|
"eval_runtime": 0.5977, |
|
"eval_samples_per_second": 284.414, |
|
"eval_steps_per_second": 5.019, |
|
"step": 3456 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"grad_norm": 2.2751259803771973, |
|
"learning_rate": 3.15e-05, |
|
"loss": 0.0632, |
|
"step": 3552 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_LOCATION_f1": 0.9054726368159205, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.9285714285714286, |
|
"eval_LOCATION_recall": 0.883495145631068, |
|
"eval_ORGANIZATION_f1": 0.9132947976878613, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.9028571428571428, |
|
"eval_ORGANIZATION_recall": 0.9239766081871345, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04872192069888115, |
|
"eval_overall_accuracy": 0.9845346589339962, |
|
"eval_overall_f1": 0.928395061728395, |
|
"eval_overall_precision": 0.928395061728395, |
|
"eval_overall_recall": 0.928395061728395, |
|
"eval_runtime": 0.5916, |
|
"eval_samples_per_second": 287.366, |
|
"eval_steps_per_second": 5.071, |
|
"step": 3552 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"grad_norm": 0.6949302554130554, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.0605, |
|
"step": 3648 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_LOCATION_f1": 0.8803827751196173, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8679245283018868, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8922155688622756, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.9141104294478528, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.05016703903675079, |
|
"eval_overall_accuracy": 0.9831538249102458, |
|
"eval_overall_f1": 0.913151364764268, |
|
"eval_overall_precision": 0.9177057356608479, |
|
"eval_overall_recall": 0.908641975308642, |
|
"eval_runtime": 0.5914, |
|
"eval_samples_per_second": 287.442, |
|
"eval_steps_per_second": 5.073, |
|
"step": 3648 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"grad_norm": 0.5452874302864075, |
|
"learning_rate": 3.05e-05, |
|
"loss": 0.0609, |
|
"step": 3744 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_LOCATION_f1": 0.8803827751196173, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8679245283018868, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8953488372093024, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8901734104046243, |
|
"eval_ORGANIZATION_recall": 0.9005847953216374, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.046954866498708725, |
|
"eval_overall_accuracy": 0.9842584921292461, |
|
"eval_overall_f1": 0.9142156862745098, |
|
"eval_overall_precision": 0.9075425790754258, |
|
"eval_overall_recall": 0.9209876543209876, |
|
"eval_runtime": 0.6085, |
|
"eval_samples_per_second": 279.378, |
|
"eval_steps_per_second": 4.93, |
|
"step": 3744 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"grad_norm": 2.737624406814575, |
|
"learning_rate": 3e-05, |
|
"loss": 0.0601, |
|
"step": 3840 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_LOCATION_f1": 0.8878048780487806, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8921568627450981, |
|
"eval_LOCATION_recall": 0.883495145631068, |
|
"eval_ORGANIZATION_f1": 0.9032258064516129, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.9058823529411765, |
|
"eval_ORGANIZATION_recall": 0.9005847953216374, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.046938493847846985, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.919653893695921, |
|
"eval_overall_precision": 0.9207920792079208, |
|
"eval_overall_recall": 0.9185185185185185, |
|
"eval_runtime": 0.5981, |
|
"eval_samples_per_second": 284.253, |
|
"eval_steps_per_second": 5.016, |
|
"step": 3840 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"grad_norm": 0.9197700619697571, |
|
"learning_rate": 2.95e-05, |
|
"loss": 0.0588, |
|
"step": 3936 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_LOCATION_f1": 0.9064039408866995, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.92, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.9137931034482759, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8983050847457628, |
|
"eval_ORGANIZATION_recall": 0.9298245614035088, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04637211561203003, |
|
"eval_overall_accuracy": 0.9864678265672466, |
|
"eval_overall_f1": 0.9287469287469288, |
|
"eval_overall_precision": 0.9242053789731052, |
|
"eval_overall_recall": 0.9333333333333333, |
|
"eval_runtime": 0.5998, |
|
"eval_samples_per_second": 283.424, |
|
"eval_steps_per_second": 5.002, |
|
"step": 3936 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"grad_norm": 0.33734437823295593, |
|
"learning_rate": 2.9e-05, |
|
"loss": 0.0576, |
|
"step": 4032 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_LOCATION_f1": 0.9064039408866995, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.92, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.9111747851002865, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8932584269662921, |
|
"eval_ORGANIZATION_recall": 0.9298245614035088, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04518849030137062, |
|
"eval_overall_accuracy": 0.9870201601767468, |
|
"eval_overall_f1": 0.9276073619631902, |
|
"eval_overall_precision": 0.9219512195121952, |
|
"eval_overall_recall": 0.9333333333333333, |
|
"eval_runtime": 0.5992, |
|
"eval_samples_per_second": 283.689, |
|
"eval_steps_per_second": 5.006, |
|
"step": 4032 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"grad_norm": 0.9250084757804871, |
|
"learning_rate": 2.8499999999999998e-05, |
|
"loss": 0.057, |
|
"step": 4128 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_LOCATION_f1": 0.8803827751196173, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8679245283018868, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8941176470588235, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8994082840236687, |
|
"eval_ORGANIZATION_recall": 0.8888888888888888, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04571167007088661, |
|
"eval_overall_accuracy": 0.9853631593482464, |
|
"eval_overall_f1": 0.9137931034482758, |
|
"eval_overall_precision": 0.9115479115479116, |
|
"eval_overall_recall": 0.9160493827160494, |
|
"eval_runtime": 0.5947, |
|
"eval_samples_per_second": 285.867, |
|
"eval_steps_per_second": 5.045, |
|
"step": 4128 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"grad_norm": 1.0702989101409912, |
|
"learning_rate": 2.8000000000000003e-05, |
|
"loss": 0.056, |
|
"step": 4224 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_LOCATION_f1": 0.8932038834951457, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8932038834951457, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8979591836734693, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8953488372093024, |
|
"eval_ORGANIZATION_recall": 0.9005847953216374, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04532807692885399, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.91871921182266, |
|
"eval_overall_precision": 0.9164619164619164, |
|
"eval_overall_recall": 0.9209876543209876, |
|
"eval_runtime": 0.6003, |
|
"eval_samples_per_second": 283.17, |
|
"eval_steps_per_second": 4.997, |
|
"step": 4224 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"grad_norm": 1.9211422204971313, |
|
"learning_rate": 2.7500000000000004e-05, |
|
"loss": 0.0557, |
|
"step": 4320 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_LOCATION_f1": 0.8761904761904761, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8598130841121495, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8914956011730205, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8941176470588236, |
|
"eval_ORGANIZATION_recall": 0.8888888888888888, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.0455101914703846, |
|
"eval_overall_accuracy": 0.9850869925434963, |
|
"eval_overall_f1": 0.9115479115479117, |
|
"eval_overall_precision": 0.9070904645476773, |
|
"eval_overall_recall": 0.9160493827160494, |
|
"eval_runtime": 0.6588, |
|
"eval_samples_per_second": 258.043, |
|
"eval_steps_per_second": 4.554, |
|
"step": 4320 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"grad_norm": 0.976703941822052, |
|
"learning_rate": 2.7000000000000002e-05, |
|
"loss": 0.0565, |
|
"step": 4416 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_LOCATION_f1": 0.8651162790697675, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8303571428571429, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8776119402985074, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8963414634146342, |
|
"eval_ORGANIZATION_recall": 0.8596491228070176, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04744512960314751, |
|
"eval_overall_accuracy": 0.9828776581054958, |
|
"eval_overall_f1": 0.902829028290283, |
|
"eval_overall_precision": 0.8995098039215687, |
|
"eval_overall_recall": 0.9061728395061729, |
|
"eval_runtime": 0.5904, |
|
"eval_samples_per_second": 287.926, |
|
"eval_steps_per_second": 5.081, |
|
"step": 4416 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"grad_norm": 0.8773436546325684, |
|
"learning_rate": 2.6500000000000004e-05, |
|
"loss": 0.0534, |
|
"step": 4512 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_LOCATION_f1": 0.8932038834951457, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8932038834951457, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8985507246376812, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8908045977011494, |
|
"eval_ORGANIZATION_recall": 0.9064327485380117, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04476306214928627, |
|
"eval_overall_accuracy": 0.9859154929577465, |
|
"eval_overall_f1": 0.920049200492005, |
|
"eval_overall_precision": 0.9166666666666666, |
|
"eval_overall_recall": 0.9234567901234568, |
|
"eval_runtime": 0.5945, |
|
"eval_samples_per_second": 285.942, |
|
"eval_steps_per_second": 5.046, |
|
"step": 4512 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"grad_norm": 1.278594970703125, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.0523, |
|
"step": 4608 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8961424332344213, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.9096385542168675, |
|
"eval_ORGANIZATION_recall": 0.8830409356725146, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04515359550714493, |
|
"eval_overall_accuracy": 0.9859154929577465, |
|
"eval_overall_f1": 0.9149198520345252, |
|
"eval_overall_precision": 0.9137931034482759, |
|
"eval_overall_recall": 0.9160493827160494, |
|
"eval_runtime": 0.5953, |
|
"eval_samples_per_second": 285.59, |
|
"eval_steps_per_second": 5.04, |
|
"step": 4608 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"grad_norm": 0.56380695104599, |
|
"learning_rate": 2.5500000000000003e-05, |
|
"loss": 0.0523, |
|
"step": 4704 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8856304985337242, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.888235294117647, |
|
"eval_ORGANIZATION_recall": 0.8830409356725146, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04556996375322342, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.9104294478527607, |
|
"eval_overall_precision": 0.9048780487804878, |
|
"eval_overall_recall": 0.9160493827160494, |
|
"eval_runtime": 0.5918, |
|
"eval_samples_per_second": 287.26, |
|
"eval_steps_per_second": 5.069, |
|
"step": 4704 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"grad_norm": 1.6369190216064453, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.0509, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_LOCATION_f1": 0.8773584905660378, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8532110091743119, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8802395209580838, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.901840490797546, |
|
"eval_ORGANIZATION_recall": 0.8596491228070176, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.046390656381845474, |
|
"eval_overall_accuracy": 0.9828776581054958, |
|
"eval_overall_f1": 0.9084158415841586, |
|
"eval_overall_precision": 0.9106699751861043, |
|
"eval_overall_recall": 0.9061728395061729, |
|
"eval_runtime": 0.6054, |
|
"eval_samples_per_second": 280.8, |
|
"eval_steps_per_second": 4.955, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"grad_norm": 0.7033815383911133, |
|
"learning_rate": 2.45e-05, |
|
"loss": 0.052, |
|
"step": 4896 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_LOCATION_f1": 0.8663594470046084, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8245614035087719, |
|
"eval_LOCATION_recall": 0.912621359223301, |
|
"eval_ORGANIZATION_f1": 0.8795180722891567, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.906832298136646, |
|
"eval_ORGANIZATION_recall": 0.8538011695906432, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04676185920834541, |
|
"eval_overall_accuracy": 0.9842584921292461, |
|
"eval_overall_f1": 0.9050554870530209, |
|
"eval_overall_precision": 0.9039408866995073, |
|
"eval_overall_recall": 0.9061728395061729, |
|
"eval_runtime": 0.5936, |
|
"eval_samples_per_second": 286.386, |
|
"eval_steps_per_second": 5.054, |
|
"step": 4896 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"grad_norm": 0.6778050065040588, |
|
"learning_rate": 2.4e-05, |
|
"loss": 0.0511, |
|
"step": 4992 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_LOCATION_f1": 0.8975609756097561, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.9019607843137255, |
|
"eval_LOCATION_recall": 0.8932038834951457, |
|
"eval_ORGANIZATION_f1": 0.8979591836734693, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8953488372093024, |
|
"eval_ORGANIZATION_recall": 0.9005847953216374, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04431942105293274, |
|
"eval_overall_accuracy": 0.9861916597624966, |
|
"eval_overall_f1": 0.9209876543209876, |
|
"eval_overall_precision": 0.9209876543209876, |
|
"eval_overall_recall": 0.9209876543209876, |
|
"eval_runtime": 0.6009, |
|
"eval_samples_per_second": 282.922, |
|
"eval_steps_per_second": 4.993, |
|
"step": 4992 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"grad_norm": 0.7755054831504822, |
|
"learning_rate": 2.35e-05, |
|
"loss": 0.051, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_LOCATION_f1": 0.8773584905660378, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8532110091743119, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8875739644970414, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8982035928143712, |
|
"eval_ORGANIZATION_recall": 0.8771929824561403, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.045676685869693756, |
|
"eval_overall_accuracy": 0.983982325324496, |
|
"eval_overall_f1": 0.9102091020910209, |
|
"eval_overall_precision": 0.9068627450980392, |
|
"eval_overall_recall": 0.9135802469135802, |
|
"eval_runtime": 0.61, |
|
"eval_samples_per_second": 278.668, |
|
"eval_steps_per_second": 4.918, |
|
"step": 5088 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"grad_norm": 0.47155851125717163, |
|
"learning_rate": 2.3000000000000003e-05, |
|
"loss": 0.0483, |
|
"step": 5184 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_LOCATION_f1": 0.9029126213592235, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.9029126213592233, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.9017341040462428, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8914285714285715, |
|
"eval_ORGANIZATION_recall": 0.9122807017543859, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.044774431735277176, |
|
"eval_overall_accuracy": 0.9856393261529964, |
|
"eval_overall_f1": 0.9238329238329238, |
|
"eval_overall_precision": 0.9193154034229829, |
|
"eval_overall_recall": 0.928395061728395, |
|
"eval_runtime": 0.5995, |
|
"eval_samples_per_second": 283.593, |
|
"eval_steps_per_second": 5.005, |
|
"step": 5184 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"grad_norm": 1.5237046480178833, |
|
"learning_rate": 2.25e-05, |
|
"loss": 0.0525, |
|
"step": 5280 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_LOCATION_f1": 0.8899521531100479, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8773584905660378, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8953488372093024, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8901734104046243, |
|
"eval_ORGANIZATION_recall": 0.9005847953216374, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04513506591320038, |
|
"eval_overall_accuracy": 0.9853631593482464, |
|
"eval_overall_f1": 0.9177914110429448, |
|
"eval_overall_precision": 0.9121951219512195, |
|
"eval_overall_recall": 0.9234567901234568, |
|
"eval_runtime": 0.6045, |
|
"eval_samples_per_second": 281.204, |
|
"eval_steps_per_second": 4.962, |
|
"step": 5280 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"grad_norm": 0.6528781652450562, |
|
"learning_rate": 2.2000000000000003e-05, |
|
"loss": 0.0479, |
|
"step": 5376 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_LOCATION_f1": 0.8857142857142858, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8691588785046729, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8914956011730205, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8941176470588236, |
|
"eval_ORGANIZATION_recall": 0.8888888888888888, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04449770227074623, |
|
"eval_overall_accuracy": 0.9850869925434963, |
|
"eval_overall_f1": 0.915129151291513, |
|
"eval_overall_precision": 0.9117647058823529, |
|
"eval_overall_recall": 0.9185185185185185, |
|
"eval_runtime": 0.5981, |
|
"eval_samples_per_second": 284.219, |
|
"eval_steps_per_second": 5.016, |
|
"step": 5376 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"grad_norm": 1.4258739948272705, |
|
"learning_rate": 2.15e-05, |
|
"loss": 0.0486, |
|
"step": 5472 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_LOCATION_f1": 0.8857142857142858, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8691588785046729, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8888888888888888, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8888888888888888, |
|
"eval_ORGANIZATION_recall": 0.8888888888888888, |
|
"eval_PERSON_f1": 0.9657794676806084, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9621212121212122, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.044527389109134674, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.9128834355828221, |
|
"eval_overall_precision": 0.9073170731707317, |
|
"eval_overall_recall": 0.9185185185185185, |
|
"eval_runtime": 0.597, |
|
"eval_samples_per_second": 284.74, |
|
"eval_steps_per_second": 5.025, |
|
"step": 5472 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"grad_norm": 0.6324487924575806, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.0457, |
|
"step": 5568 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_LOCATION_f1": 0.8857142857142858, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8691588785046729, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8947368421052632, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8947368421052632, |
|
"eval_ORGANIZATION_recall": 0.8947368421052632, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04367503523826599, |
|
"eval_overall_accuracy": 0.9856393261529964, |
|
"eval_overall_f1": 0.9164619164619164, |
|
"eval_overall_precision": 0.9119804400977995, |
|
"eval_overall_recall": 0.9209876543209876, |
|
"eval_runtime": 0.6033, |
|
"eval_samples_per_second": 281.778, |
|
"eval_steps_per_second": 4.973, |
|
"step": 5568 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"grad_norm": 1.5328294038772583, |
|
"learning_rate": 2.05e-05, |
|
"loss": 0.0478, |
|
"step": 5664 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_LOCATION_f1": 0.8773584905660378, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8532110091743119, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8816568047337278, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8922155688622755, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04407254979014397, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.9088669950738916, |
|
"eval_overall_precision": 0.9066339066339066, |
|
"eval_overall_recall": 0.9111111111111111, |
|
"eval_runtime": 0.6034, |
|
"eval_samples_per_second": 281.724, |
|
"eval_steps_per_second": 4.972, |
|
"step": 5664 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"grad_norm": 0.5337828993797302, |
|
"learning_rate": 2e-05, |
|
"loss": 0.0472, |
|
"step": 5760 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8849557522123894, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8928571428571429, |
|
"eval_ORGANIZATION_recall": 0.8771929824561403, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04403013363480568, |
|
"eval_overall_accuracy": 0.9850869925434963, |
|
"eval_overall_f1": 0.9113300492610836, |
|
"eval_overall_precision": 0.9090909090909091, |
|
"eval_overall_recall": 0.9135802469135802, |
|
"eval_runtime": 0.5975, |
|
"eval_samples_per_second": 284.5, |
|
"eval_steps_per_second": 5.021, |
|
"step": 5760 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"grad_norm": 0.9366702437400818, |
|
"learning_rate": 1.9500000000000003e-05, |
|
"loss": 0.049, |
|
"step": 5856 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_LOCATION_f1": 0.8942307692307693, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8857142857142857, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8895348837209303, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.884393063583815, |
|
"eval_ORGANIZATION_recall": 0.8947368421052632, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04451928660273552, |
|
"eval_overall_accuracy": 0.9853631593482464, |
|
"eval_overall_f1": 0.9164619164619164, |
|
"eval_overall_precision": 0.9119804400977995, |
|
"eval_overall_recall": 0.9209876543209876, |
|
"eval_runtime": 0.6062, |
|
"eval_samples_per_second": 280.441, |
|
"eval_steps_per_second": 4.949, |
|
"step": 5856 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"grad_norm": 1.8338637351989746, |
|
"learning_rate": 1.9e-05, |
|
"loss": 0.0476, |
|
"step": 5952 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_LOCATION_f1": 0.869158878504673, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8378378378378378, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.875739644970414, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8862275449101796, |
|
"eval_ORGANIZATION_recall": 0.8654970760233918, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.045562200248241425, |
|
"eval_overall_accuracy": 0.983982325324496, |
|
"eval_overall_f1": 0.9041769041769042, |
|
"eval_overall_precision": 0.8997555012224939, |
|
"eval_overall_recall": 0.908641975308642, |
|
"eval_runtime": 0.6542, |
|
"eval_samples_per_second": 259.871, |
|
"eval_steps_per_second": 4.586, |
|
"step": 5952 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"grad_norm": 2.0841386318206787, |
|
"learning_rate": 1.85e-05, |
|
"loss": 0.0457, |
|
"step": 6048 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_LOCATION_f1": 0.8857142857142858, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8691588785046729, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8979591836734693, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8953488372093024, |
|
"eval_ORGANIZATION_recall": 0.9005847953216374, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.043963029980659485, |
|
"eval_overall_accuracy": 0.9859154929577465, |
|
"eval_overall_f1": 0.9177914110429448, |
|
"eval_overall_precision": 0.9121951219512195, |
|
"eval_overall_recall": 0.9234567901234568, |
|
"eval_runtime": 0.6065, |
|
"eval_samples_per_second": 280.291, |
|
"eval_steps_per_second": 4.946, |
|
"step": 6048 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"grad_norm": 0.9337228536605835, |
|
"learning_rate": 1.8e-05, |
|
"loss": 0.0446, |
|
"step": 6144 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_LOCATION_f1": 0.8857142857142858, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8691588785046729, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8882352941176469, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.893491124260355, |
|
"eval_ORGANIZATION_recall": 0.8830409356725146, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04478294402360916, |
|
"eval_overall_accuracy": 0.9845346589339962, |
|
"eval_overall_f1": 0.9137931034482758, |
|
"eval_overall_precision": 0.9115479115479116, |
|
"eval_overall_recall": 0.9160493827160494, |
|
"eval_runtime": 0.5976, |
|
"eval_samples_per_second": 284.482, |
|
"eval_steps_per_second": 5.02, |
|
"step": 6144 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"grad_norm": 1.0935461521148682, |
|
"learning_rate": 1.75e-05, |
|
"loss": 0.0465, |
|
"step": 6240 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_LOCATION_f1": 0.8826291079812206, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8545454545454545, |
|
"eval_LOCATION_recall": 0.912621359223301, |
|
"eval_ORGANIZATION_f1": 0.8908554572271385, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8988095238095238, |
|
"eval_ORGANIZATION_recall": 0.8830409356725146, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04469531029462814, |
|
"eval_overall_accuracy": 0.9856393261529964, |
|
"eval_overall_f1": 0.914004914004914, |
|
"eval_overall_precision": 0.9095354523227384, |
|
"eval_overall_recall": 0.9185185185185185, |
|
"eval_runtime": 0.603, |
|
"eval_samples_per_second": 281.935, |
|
"eval_steps_per_second": 4.975, |
|
"step": 6240 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"grad_norm": 0.588843584060669, |
|
"learning_rate": 1.7000000000000003e-05, |
|
"loss": 0.0456, |
|
"step": 6336 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_LOCATION_f1": 0.8857142857142858, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8691588785046729, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8842729970326408, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8975903614457831, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04511041194200516, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.9122373300370827, |
|
"eval_overall_precision": 0.9133663366336634, |
|
"eval_overall_recall": 0.9111111111111111, |
|
"eval_runtime": 0.5959, |
|
"eval_samples_per_second": 285.269, |
|
"eval_steps_per_second": 5.034, |
|
"step": 6336 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"grad_norm": 0.40730783343315125, |
|
"learning_rate": 1.65e-05, |
|
"loss": 0.043, |
|
"step": 6432 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.874251497005988, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8957055214723927, |
|
"eval_ORGANIZATION_recall": 0.8538011695906432, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04662081599235535, |
|
"eval_overall_accuracy": 0.9823253244959956, |
|
"eval_overall_f1": 0.9070631970260223, |
|
"eval_overall_precision": 0.9104477611940298, |
|
"eval_overall_recall": 0.9037037037037037, |
|
"eval_runtime": 0.5968, |
|
"eval_samples_per_second": 284.867, |
|
"eval_steps_per_second": 5.027, |
|
"step": 6432 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"grad_norm": 1.010898470878601, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.0441, |
|
"step": 6528 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_LOCATION_f1": 0.8909952606635072, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8703703703703703, |
|
"eval_LOCATION_recall": 0.912621359223301, |
|
"eval_ORGANIZATION_f1": 0.879765395894428, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8823529411764706, |
|
"eval_ORGANIZATION_recall": 0.8771929824561403, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04551886394619942, |
|
"eval_overall_accuracy": 0.9845346589339962, |
|
"eval_overall_f1": 0.9115479115479117, |
|
"eval_overall_precision": 0.9070904645476773, |
|
"eval_overall_recall": 0.9160493827160494, |
|
"eval_runtime": 0.6631, |
|
"eval_samples_per_second": 256.37, |
|
"eval_steps_per_second": 4.524, |
|
"step": 6528 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"grad_norm": 0.356332927942276, |
|
"learning_rate": 1.55e-05, |
|
"loss": 0.0439, |
|
"step": 6624 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_LOCATION_f1": 0.8857142857142858, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8691588785046729, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.879765395894428, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8823529411764706, |
|
"eval_ORGANIZATION_recall": 0.8771929824561403, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04542705416679382, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.9102091020910209, |
|
"eval_overall_precision": 0.9068627450980392, |
|
"eval_overall_recall": 0.9135802469135802, |
|
"eval_runtime": 0.5976, |
|
"eval_samples_per_second": 284.455, |
|
"eval_steps_per_second": 5.02, |
|
"step": 6624 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"grad_norm": 0.5880185961723328, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.0439, |
|
"step": 6720 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8882352941176469, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.893491124260355, |
|
"eval_ORGANIZATION_recall": 0.8830409356725146, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.044994134455919266, |
|
"eval_overall_accuracy": 0.9850869925434963, |
|
"eval_overall_f1": 0.9126691266912669, |
|
"eval_overall_precision": 0.9093137254901961, |
|
"eval_overall_recall": 0.9160493827160494, |
|
"eval_runtime": 0.597, |
|
"eval_samples_per_second": 284.742, |
|
"eval_steps_per_second": 5.025, |
|
"step": 6720 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"grad_norm": 0.9274646639823914, |
|
"learning_rate": 1.45e-05, |
|
"loss": 0.0428, |
|
"step": 6816 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_LOCATION_f1": 0.8952380952380954, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8785046728971962, |
|
"eval_LOCATION_recall": 0.912621359223301, |
|
"eval_ORGANIZATION_f1": 0.8888888888888888, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8888888888888888, |
|
"eval_ORGANIZATION_recall": 0.8888888888888888, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04472970589995384, |
|
"eval_overall_accuracy": 0.9859154929577465, |
|
"eval_overall_f1": 0.9164619164619164, |
|
"eval_overall_precision": 0.9119804400977995, |
|
"eval_overall_recall": 0.9209876543209876, |
|
"eval_runtime": 0.5987, |
|
"eval_samples_per_second": 283.931, |
|
"eval_steps_per_second": 5.011, |
|
"step": 6816 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"grad_norm": 0.35504868626594543, |
|
"learning_rate": 1.4000000000000001e-05, |
|
"loss": 0.0438, |
|
"step": 6912 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8795180722891567, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.906832298136646, |
|
"eval_ORGANIZATION_recall": 0.8538011695906432, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.046420272439718246, |
|
"eval_overall_accuracy": 0.9828776581054958, |
|
"eval_overall_f1": 0.9093167701863354, |
|
"eval_overall_precision": 0.915, |
|
"eval_overall_recall": 0.9037037037037037, |
|
"eval_runtime": 0.5929, |
|
"eval_samples_per_second": 286.713, |
|
"eval_steps_per_second": 5.06, |
|
"step": 6912 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"grad_norm": 1.1146135330200195, |
|
"learning_rate": 1.3500000000000001e-05, |
|
"loss": 0.0431, |
|
"step": 7008 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_LOCATION_f1": 0.8867924528301887, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8623853211009175, |
|
"eval_LOCATION_recall": 0.912621359223301, |
|
"eval_ORGANIZATION_f1": 0.8823529411764705, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8875739644970414, |
|
"eval_ORGANIZATION_recall": 0.8771929824561403, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.044833190739154816, |
|
"eval_overall_accuracy": 0.9856393261529964, |
|
"eval_overall_f1": 0.9115479115479117, |
|
"eval_overall_precision": 0.9070904645476773, |
|
"eval_overall_recall": 0.9160493827160494, |
|
"eval_runtime": 0.606, |
|
"eval_samples_per_second": 280.509, |
|
"eval_steps_per_second": 4.95, |
|
"step": 7008 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"grad_norm": 0.3997597396373749, |
|
"learning_rate": 1.3000000000000001e-05, |
|
"loss": 0.0415, |
|
"step": 7104 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_LOCATION_f1": 0.8773584905660378, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8532110091743119, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.875739644970414, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8862275449101796, |
|
"eval_ORGANIZATION_recall": 0.8654970760233918, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04576844349503517, |
|
"eval_overall_accuracy": 0.9842584921292461, |
|
"eval_overall_f1": 0.9064039408866995, |
|
"eval_overall_precision": 0.9041769041769042, |
|
"eval_overall_recall": 0.908641975308642, |
|
"eval_runtime": 0.6179, |
|
"eval_samples_per_second": 275.116, |
|
"eval_steps_per_second": 4.855, |
|
"step": 7104 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"grad_norm": 0.6900985836982727, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0429, |
|
"step": 7200 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8731563421828908, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8809523809523809, |
|
"eval_ORGANIZATION_recall": 0.8654970760233918, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.046131208539009094, |
|
"eval_overall_accuracy": 0.983982325324496, |
|
"eval_overall_f1": 0.9064039408866995, |
|
"eval_overall_precision": 0.9041769041769042, |
|
"eval_overall_recall": 0.908641975308642, |
|
"eval_runtime": 0.6007, |
|
"eval_samples_per_second": 283.003, |
|
"eval_steps_per_second": 4.994, |
|
"step": 7200 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"grad_norm": 0.35220813751220703, |
|
"learning_rate": 1.2e-05, |
|
"loss": 0.0426, |
|
"step": 7296 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8731563421828908, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8809523809523809, |
|
"eval_ORGANIZATION_recall": 0.8654970760233918, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04544881358742714, |
|
"eval_overall_accuracy": 0.9845346589339962, |
|
"eval_overall_f1": 0.9064039408866995, |
|
"eval_overall_precision": 0.9041769041769042, |
|
"eval_overall_recall": 0.908641975308642, |
|
"eval_runtime": 0.5968, |
|
"eval_samples_per_second": 284.861, |
|
"eval_steps_per_second": 5.027, |
|
"step": 7296 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"grad_norm": 0.7620628476142883, |
|
"learning_rate": 1.1500000000000002e-05, |
|
"loss": 0.043, |
|
"step": 7392 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_LOCATION_f1": 0.8857142857142858, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8691588785046729, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.875739644970414, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8862275449101796, |
|
"eval_ORGANIZATION_recall": 0.8654970760233918, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04560285061597824, |
|
"eval_overall_accuracy": 0.9845346589339962, |
|
"eval_overall_f1": 0.908641975308642, |
|
"eval_overall_precision": 0.908641975308642, |
|
"eval_overall_recall": 0.908641975308642, |
|
"eval_runtime": 0.5922, |
|
"eval_samples_per_second": 287.086, |
|
"eval_steps_per_second": 5.066, |
|
"step": 7392 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"grad_norm": 0.6972180008888245, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.0397, |
|
"step": 7488 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8842729970326408, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8975903614457831, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.045004814863204956, |
|
"eval_overall_accuracy": 0.9856393261529964, |
|
"eval_overall_f1": 0.9111111111111111, |
|
"eval_overall_precision": 0.9111111111111111, |
|
"eval_overall_recall": 0.9111111111111111, |
|
"eval_runtime": 0.5949, |
|
"eval_samples_per_second": 285.753, |
|
"eval_steps_per_second": 5.043, |
|
"step": 7488 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"grad_norm": 1.175458312034607, |
|
"learning_rate": 1.05e-05, |
|
"loss": 0.0411, |
|
"step": 7584 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8731563421828908, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8809523809523809, |
|
"eval_ORGANIZATION_recall": 0.8654970760233918, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04489603638648987, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.9064039408866995, |
|
"eval_overall_precision": 0.9041769041769042, |
|
"eval_overall_recall": 0.908641975308642, |
|
"eval_runtime": 0.5924, |
|
"eval_samples_per_second": 286.953, |
|
"eval_steps_per_second": 5.064, |
|
"step": 7584 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"grad_norm": 1.935158610343933, |
|
"learning_rate": 1e-05, |
|
"loss": 0.0417, |
|
"step": 7680 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8823529411764705, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8875739644970414, |
|
"eval_ORGANIZATION_recall": 0.8771929824561403, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04481157660484314, |
|
"eval_overall_accuracy": 0.9856393261529964, |
|
"eval_overall_f1": 0.9102091020910209, |
|
"eval_overall_precision": 0.9068627450980392, |
|
"eval_overall_recall": 0.9135802469135802, |
|
"eval_runtime": 0.6085, |
|
"eval_samples_per_second": 279.37, |
|
"eval_steps_per_second": 4.93, |
|
"step": 7680 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"grad_norm": 0.7792730927467346, |
|
"learning_rate": 9.5e-06, |
|
"loss": 0.0423, |
|
"step": 7776 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8823529411764705, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8875739644970414, |
|
"eval_ORGANIZATION_recall": 0.8771929824561403, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04457651078701019, |
|
"eval_overall_accuracy": 0.9856393261529964, |
|
"eval_overall_f1": 0.9102091020910209, |
|
"eval_overall_precision": 0.9068627450980392, |
|
"eval_overall_recall": 0.9135802469135802, |
|
"eval_runtime": 0.6034, |
|
"eval_samples_per_second": 281.758, |
|
"eval_steps_per_second": 4.972, |
|
"step": 7776 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"grad_norm": 1.640648365020752, |
|
"learning_rate": 9e-06, |
|
"loss": 0.0434, |
|
"step": 7872 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8994082840236686, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.9101796407185628, |
|
"eval_ORGANIZATION_recall": 0.8888888888888888, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04452081397175789, |
|
"eval_overall_accuracy": 0.9861916597624966, |
|
"eval_overall_f1": 0.9173859432799014, |
|
"eval_overall_precision": 0.916256157635468, |
|
"eval_overall_recall": 0.9185185185185185, |
|
"eval_runtime": 0.6038, |
|
"eval_samples_per_second": 281.535, |
|
"eval_steps_per_second": 4.968, |
|
"step": 7872 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"grad_norm": 0.8310399651527405, |
|
"learning_rate": 8.500000000000002e-06, |
|
"loss": 0.0394, |
|
"step": 7968 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8731563421828908, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8809523809523809, |
|
"eval_ORGANIZATION_recall": 0.8654970760233918, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04489120468497276, |
|
"eval_overall_accuracy": 0.9850869925434963, |
|
"eval_overall_f1": 0.9064039408866995, |
|
"eval_overall_precision": 0.9041769041769042, |
|
"eval_overall_recall": 0.908641975308642, |
|
"eval_runtime": 0.6046, |
|
"eval_samples_per_second": 281.181, |
|
"eval_steps_per_second": 4.962, |
|
"step": 7968 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"grad_norm": 0.9918228387832642, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0413, |
|
"step": 8064 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8809523809523809, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.896969696969697, |
|
"eval_ORGANIZATION_recall": 0.8654970760233918, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04544991999864578, |
|
"eval_overall_accuracy": 0.9850869925434963, |
|
"eval_overall_f1": 0.9097651421508034, |
|
"eval_overall_precision": 0.9108910891089109, |
|
"eval_overall_recall": 0.908641975308642, |
|
"eval_runtime": 0.6004, |
|
"eval_samples_per_second": 283.156, |
|
"eval_steps_per_second": 4.997, |
|
"step": 8064 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"grad_norm": 0.9799830317497253, |
|
"learning_rate": 7.5e-06, |
|
"loss": 0.0408, |
|
"step": 8160 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8783382789317508, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.891566265060241, |
|
"eval_ORGANIZATION_recall": 0.8654970760233918, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.045652709901332855, |
|
"eval_overall_accuracy": 0.9842584921292461, |
|
"eval_overall_f1": 0.908641975308642, |
|
"eval_overall_precision": 0.908641975308642, |
|
"eval_overall_recall": 0.908641975308642, |
|
"eval_runtime": 0.604, |
|
"eval_samples_per_second": 281.458, |
|
"eval_steps_per_second": 4.967, |
|
"step": 8160 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"grad_norm": 1.889784574508667, |
|
"learning_rate": 7.000000000000001e-06, |
|
"loss": 0.0412, |
|
"step": 8256 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8731563421828908, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8809523809523809, |
|
"eval_ORGANIZATION_recall": 0.8654970760233918, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.045468661934137344, |
|
"eval_overall_accuracy": 0.9845346589339962, |
|
"eval_overall_f1": 0.9064039408866995, |
|
"eval_overall_precision": 0.9041769041769042, |
|
"eval_overall_recall": 0.908641975308642, |
|
"eval_runtime": 0.6007, |
|
"eval_samples_per_second": 283.007, |
|
"eval_steps_per_second": 4.994, |
|
"step": 8256 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"grad_norm": 1.0306001901626587, |
|
"learning_rate": 6.5000000000000004e-06, |
|
"loss": 0.0425, |
|
"step": 8352 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8731563421828908, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8809523809523809, |
|
"eval_ORGANIZATION_recall": 0.8654970760233918, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.045380450785160065, |
|
"eval_overall_accuracy": 0.9842584921292461, |
|
"eval_overall_f1": 0.9064039408866995, |
|
"eval_overall_precision": 0.9041769041769042, |
|
"eval_overall_recall": 0.908641975308642, |
|
"eval_runtime": 0.607, |
|
"eval_samples_per_second": 280.052, |
|
"eval_steps_per_second": 4.942, |
|
"step": 8352 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"grad_norm": 1.6095170974731445, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0404, |
|
"step": 8448 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8764705882352941, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8816568047337278, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.045171529054641724, |
|
"eval_overall_accuracy": 0.9850869925434963, |
|
"eval_overall_f1": 0.9077490774907748, |
|
"eval_overall_precision": 0.9044117647058824, |
|
"eval_overall_recall": 0.9111111111111111, |
|
"eval_runtime": 0.5928, |
|
"eval_samples_per_second": 286.772, |
|
"eval_steps_per_second": 5.061, |
|
"step": 8448 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"grad_norm": 1.9292471408843994, |
|
"learning_rate": 5.500000000000001e-06, |
|
"loss": 0.0403, |
|
"step": 8544 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.875739644970414, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8862275449101796, |
|
"eval_ORGANIZATION_recall": 0.8654970760233918, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04589909315109253, |
|
"eval_overall_accuracy": 0.9842584921292461, |
|
"eval_overall_f1": 0.9075215782983971, |
|
"eval_overall_precision": 0.9064039408866995, |
|
"eval_overall_recall": 0.908641975308642, |
|
"eval_runtime": 0.6049, |
|
"eval_samples_per_second": 281.046, |
|
"eval_steps_per_second": 4.96, |
|
"step": 8544 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"grad_norm": 0.9496196508407593, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0395, |
|
"step": 8640 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8739002932551321, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8764705882352941, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04514380544424057, |
|
"eval_overall_accuracy": 0.9845346589339962, |
|
"eval_overall_f1": 0.9066339066339066, |
|
"eval_overall_precision": 0.902200488997555, |
|
"eval_overall_recall": 0.9111111111111111, |
|
"eval_runtime": 0.6057, |
|
"eval_samples_per_second": 280.676, |
|
"eval_steps_per_second": 4.953, |
|
"step": 8640 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"grad_norm": 1.498864769935608, |
|
"learning_rate": 4.5e-06, |
|
"loss": 0.0413, |
|
"step": 8736 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8739002932551321, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8764705882352941, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04504216089844704, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.9066339066339066, |
|
"eval_overall_precision": 0.902200488997555, |
|
"eval_overall_recall": 0.9111111111111111, |
|
"eval_runtime": 0.6, |
|
"eval_samples_per_second": 283.336, |
|
"eval_steps_per_second": 5.0, |
|
"step": 8736 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"grad_norm": 0.8939065337181091, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.039, |
|
"step": 8832 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8739002932551321, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8764705882352941, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04519949480891228, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.9066339066339066, |
|
"eval_overall_precision": 0.902200488997555, |
|
"eval_overall_recall": 0.9111111111111111, |
|
"eval_runtime": 0.6015, |
|
"eval_samples_per_second": 282.646, |
|
"eval_steps_per_second": 4.988, |
|
"step": 8832 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"grad_norm": 76.55709838867188, |
|
"learning_rate": 3.5000000000000004e-06, |
|
"loss": 0.0402, |
|
"step": 8928 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8764705882352941, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8816568047337278, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.045382946729660034, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.9077490774907748, |
|
"eval_overall_precision": 0.9044117647058824, |
|
"eval_overall_recall": 0.9111111111111111, |
|
"eval_runtime": 0.5985, |
|
"eval_samples_per_second": 284.026, |
|
"eval_steps_per_second": 5.012, |
|
"step": 8928 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"grad_norm": 0.24397915601730347, |
|
"learning_rate": 3e-06, |
|
"loss": 0.0397, |
|
"step": 9024 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8739002932551321, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8764705882352941, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.045313529670238495, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.9066339066339066, |
|
"eval_overall_precision": 0.902200488997555, |
|
"eval_overall_recall": 0.9111111111111111, |
|
"eval_runtime": 0.5887, |
|
"eval_samples_per_second": 288.767, |
|
"eval_steps_per_second": 5.096, |
|
"step": 9024 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"grad_norm": 0.29766303300857544, |
|
"learning_rate": 2.5e-06, |
|
"loss": 0.0409, |
|
"step": 9120 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8764705882352941, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8816568047337278, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.045457012951374054, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.9077490774907748, |
|
"eval_overall_precision": 0.9044117647058824, |
|
"eval_overall_recall": 0.9111111111111111, |
|
"eval_runtime": 0.5948, |
|
"eval_samples_per_second": 285.825, |
|
"eval_steps_per_second": 5.044, |
|
"step": 9120 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"grad_norm": 1.5634249448776245, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.039, |
|
"step": 9216 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8739002932551321, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8764705882352941, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.0454791858792305, |
|
"eval_overall_accuracy": 0.9845346589339962, |
|
"eval_overall_f1": 0.9066339066339066, |
|
"eval_overall_precision": 0.902200488997555, |
|
"eval_overall_recall": 0.9111111111111111, |
|
"eval_runtime": 0.5934, |
|
"eval_samples_per_second": 286.492, |
|
"eval_steps_per_second": 5.056, |
|
"step": 9216 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"grad_norm": 0.9605298042297363, |
|
"learning_rate": 1.5e-06, |
|
"loss": 0.0402, |
|
"step": 9312 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8739002932551321, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8764705882352941, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.0456123985350132, |
|
"eval_overall_accuracy": 0.9845346589339962, |
|
"eval_overall_f1": 0.9066339066339066, |
|
"eval_overall_precision": 0.902200488997555, |
|
"eval_overall_recall": 0.9111111111111111, |
|
"eval_runtime": 0.6745, |
|
"eval_samples_per_second": 252.035, |
|
"eval_steps_per_second": 4.448, |
|
"step": 9312 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"grad_norm": 1.7611069679260254, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0382, |
|
"step": 9408 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8764705882352941, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8816568047337278, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04547755792737007, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.9077490774907748, |
|
"eval_overall_precision": 0.9044117647058824, |
|
"eval_overall_recall": 0.9111111111111111, |
|
"eval_runtime": 0.5989, |
|
"eval_samples_per_second": 283.847, |
|
"eval_steps_per_second": 5.009, |
|
"step": 9408 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"grad_norm": 0.4898216426372528, |
|
"learning_rate": 5.000000000000001e-07, |
|
"loss": 0.0392, |
|
"step": 9504 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8764705882352941, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8816568047337278, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.04550032317638397, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.9077490774907748, |
|
"eval_overall_precision": 0.9044117647058824, |
|
"eval_overall_recall": 0.9111111111111111, |
|
"eval_runtime": 0.5984, |
|
"eval_samples_per_second": 284.085, |
|
"eval_steps_per_second": 5.013, |
|
"step": 9504 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"grad_norm": 1.0116997957229614, |
|
"learning_rate": 0.0, |
|
"loss": 0.0412, |
|
"step": 9600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_LOCATION_f1": 0.8815165876777251, |
|
"eval_LOCATION_number": 103, |
|
"eval_LOCATION_precision": 0.8611111111111112, |
|
"eval_LOCATION_recall": 0.9029126213592233, |
|
"eval_ORGANIZATION_f1": 0.8764705882352941, |
|
"eval_ORGANIZATION_number": 171, |
|
"eval_ORGANIZATION_precision": 0.8816568047337278, |
|
"eval_ORGANIZATION_recall": 0.8713450292397661, |
|
"eval_PERSON_f1": 0.9694656488549618, |
|
"eval_PERSON_number": 131, |
|
"eval_PERSON_precision": 0.9694656488549618, |
|
"eval_PERSON_recall": 0.9694656488549618, |
|
"eval_loss": 0.045390497893095016, |
|
"eval_overall_accuracy": 0.9848108257387462, |
|
"eval_overall_f1": 0.9077490774907748, |
|
"eval_overall_precision": 0.9044117647058824, |
|
"eval_overall_recall": 0.9111111111111111, |
|
"eval_runtime": 0.6032, |
|
"eval_samples_per_second": 281.85, |
|
"eval_steps_per_second": 4.974, |
|
"step": 9600 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"step": 9600, |
|
"total_flos": 3889996718638620.0, |
|
"train_loss": 0.09181262865662575, |
|
"train_runtime": 1037.4922, |
|
"train_samples_per_second": 147.567, |
|
"train_steps_per_second": 9.253 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 9600, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 100, |
|
"save_steps": 500, |
|
"total_flos": 3889996718638620.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|