|
{ |
|
"best_metric": 0.3805309734513274, |
|
"best_model_checkpoint": "car_identified_model_7/checkpoint-188", |
|
"epoch": 145.45454545454547, |
|
"eval_steps": 500, |
|
"global_step": 200, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.73, |
|
"learning_rate": 1.9900000000000003e-05, |
|
"loss": 0.6919, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 0.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.17857142857142858, |
|
"eval_loss": 0.6887282133102417, |
|
"eval_roc_auc": 0.5737577639751552, |
|
"eval_runtime": 2.8648, |
|
"eval_samples_per_second": 14.661, |
|
"eval_steps_per_second": 1.047, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 1.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.1818181818181818, |
|
"eval_loss": 0.6855647563934326, |
|
"eval_roc_auc": 0.5760869565217391, |
|
"eval_runtime": 2.5822, |
|
"eval_samples_per_second": 16.265, |
|
"eval_steps_per_second": 1.162, |
|
"step": 2 |
|
}, |
|
{ |
|
"epoch": 2.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.21164021164021166, |
|
"eval_loss": 0.6802406311035156, |
|
"eval_roc_auc": 0.6066252587991718, |
|
"eval_runtime": 2.1976, |
|
"eval_samples_per_second": 19.112, |
|
"eval_steps_per_second": 1.365, |
|
"step": 4 |
|
}, |
|
{ |
|
"epoch": 3.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.18614718614718614, |
|
"eval_loss": 0.6800228953361511, |
|
"eval_roc_auc": 0.5825569358178053, |
|
"eval_runtime": 2.1512, |
|
"eval_samples_per_second": 19.524, |
|
"eval_steps_per_second": 1.395, |
|
"step": 5 |
|
}, |
|
{ |
|
"epoch": 4.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.1904761904761905, |
|
"eval_loss": 0.6858328580856323, |
|
"eval_roc_auc": 0.5973084886128365, |
|
"eval_runtime": 1.8993, |
|
"eval_samples_per_second": 22.113, |
|
"eval_steps_per_second": 1.58, |
|
"step": 6 |
|
}, |
|
{ |
|
"epoch": 5.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.15492957746478872, |
|
"eval_loss": 0.693770706653595, |
|
"eval_roc_auc": 0.5341614906832298, |
|
"eval_runtime": 1.986, |
|
"eval_samples_per_second": 21.148, |
|
"eval_steps_per_second": 1.511, |
|
"step": 8 |
|
}, |
|
{ |
|
"epoch": 6.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.18050541516245489, |
|
"eval_loss": 0.6917278170585632, |
|
"eval_roc_auc": 0.5802277432712216, |
|
"eval_runtime": 1.8331, |
|
"eval_samples_per_second": 22.911, |
|
"eval_steps_per_second": 1.637, |
|
"step": 9 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.19047619047619044, |
|
"eval_loss": 0.6735165119171143, |
|
"eval_roc_auc": 0.593167701863354, |
|
"eval_runtime": 2.0579, |
|
"eval_samples_per_second": 20.409, |
|
"eval_steps_per_second": 1.458, |
|
"step": 11 |
|
}, |
|
{ |
|
"epoch": 8.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.1952191235059761, |
|
"eval_loss": 0.6727393865585327, |
|
"eval_roc_auc": 0.6006728778467909, |
|
"eval_runtime": 1.8528, |
|
"eval_samples_per_second": 22.669, |
|
"eval_steps_per_second": 1.619, |
|
"step": 12 |
|
}, |
|
{ |
|
"epoch": 9.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.20606060606060606, |
|
"eval_loss": 0.6698008179664612, |
|
"eval_roc_auc": 0.6172360248447204, |
|
"eval_runtime": 2.0897, |
|
"eval_samples_per_second": 20.099, |
|
"eval_steps_per_second": 1.436, |
|
"step": 13 |
|
}, |
|
{ |
|
"epoch": 10.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.20080321285140562, |
|
"eval_loss": 0.6671529412269592, |
|
"eval_roc_auc": 0.6092132505175983, |
|
"eval_runtime": 1.8899, |
|
"eval_samples_per_second": 22.224, |
|
"eval_steps_per_second": 1.587, |
|
"step": 15 |
|
}, |
|
{ |
|
"epoch": 11.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2092050209205021, |
|
"eval_loss": 0.6645169854164124, |
|
"eval_roc_auc": 0.6195652173913044, |
|
"eval_runtime": 1.9211, |
|
"eval_samples_per_second": 21.863, |
|
"eval_steps_per_second": 1.562, |
|
"step": 16 |
|
}, |
|
{ |
|
"epoch": 12.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.20491803278688525, |
|
"eval_loss": 0.6645674705505371, |
|
"eval_roc_auc": 0.6143892339544513, |
|
"eval_runtime": 1.9806, |
|
"eval_samples_per_second": 21.206, |
|
"eval_steps_per_second": 1.515, |
|
"step": 17 |
|
}, |
|
{ |
|
"epoch": 13.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.208067940552017, |
|
"eval_loss": 0.6622694134712219, |
|
"eval_roc_auc": 0.6167184265010353, |
|
"eval_runtime": 2.0813, |
|
"eval_samples_per_second": 20.179, |
|
"eval_steps_per_second": 1.441, |
|
"step": 19 |
|
}, |
|
{ |
|
"epoch": 14.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.20779220779220778, |
|
"eval_loss": 0.6606575846672058, |
|
"eval_roc_auc": 0.6149068322981366, |
|
"eval_runtime": 1.8418, |
|
"eval_samples_per_second": 22.803, |
|
"eval_steps_per_second": 1.629, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.22026431718061673, |
|
"eval_loss": 0.6584673523902893, |
|
"eval_roc_auc": 0.6319875776397516, |
|
"eval_runtime": 2.024, |
|
"eval_samples_per_second": 20.751, |
|
"eval_steps_per_second": 1.482, |
|
"step": 22 |
|
}, |
|
{ |
|
"epoch": 16.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.21559633027522934, |
|
"eval_loss": 0.6561669111251831, |
|
"eval_roc_auc": 0.6218944099378882, |
|
"eval_runtime": 1.8303, |
|
"eval_samples_per_second": 22.947, |
|
"eval_steps_per_second": 1.639, |
|
"step": 23 |
|
}, |
|
{ |
|
"epoch": 17.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.21818181818181817, |
|
"eval_loss": 0.6555350422859192, |
|
"eval_roc_auc": 0.6262939958592133, |
|
"eval_runtime": 1.9854, |
|
"eval_samples_per_second": 21.154, |
|
"eval_steps_per_second": 1.511, |
|
"step": 24 |
|
}, |
|
{ |
|
"epoch": 18.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2185273159144893, |
|
"eval_loss": 0.652241051197052, |
|
"eval_roc_auc": 0.6231884057971014, |
|
"eval_runtime": 1.9789, |
|
"eval_samples_per_second": 21.224, |
|
"eval_steps_per_second": 1.516, |
|
"step": 26 |
|
}, |
|
{ |
|
"epoch": 19.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.22276029055690072, |
|
"eval_loss": 0.6512007713317871, |
|
"eval_roc_auc": 0.6273291925465838, |
|
"eval_runtime": 2.0333, |
|
"eval_samples_per_second": 20.656, |
|
"eval_steps_per_second": 1.475, |
|
"step": 27 |
|
}, |
|
{ |
|
"epoch": 20.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.23558897243107768, |
|
"eval_loss": 0.6501262187957764, |
|
"eval_roc_auc": 0.6410455486542443, |
|
"eval_runtime": 2.1299, |
|
"eval_samples_per_second": 19.719, |
|
"eval_steps_per_second": 1.409, |
|
"step": 28 |
|
}, |
|
{ |
|
"epoch": 21.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.22797927461139897, |
|
"eval_loss": 0.6477265357971191, |
|
"eval_roc_auc": 0.6283643892339545, |
|
"eval_runtime": 1.8983, |
|
"eval_samples_per_second": 22.125, |
|
"eval_steps_per_second": 1.58, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 22.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.23255813953488372, |
|
"eval_loss": 0.6476041078567505, |
|
"eval_roc_auc": 0.6343167701863355, |
|
"eval_runtime": 2.1591, |
|
"eval_samples_per_second": 19.452, |
|
"eval_steps_per_second": 1.389, |
|
"step": 31 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.24083769633507857, |
|
"eval_loss": 0.6469409465789795, |
|
"eval_roc_auc": 0.6433747412008282, |
|
"eval_runtime": 1.8477, |
|
"eval_samples_per_second": 22.731, |
|
"eval_steps_per_second": 1.624, |
|
"step": 33 |
|
}, |
|
{ |
|
"epoch": 24.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.24089635854341737, |
|
"eval_loss": 0.6432453393936157, |
|
"eval_roc_auc": 0.6369047619047619, |
|
"eval_runtime": 2.1797, |
|
"eval_samples_per_second": 19.268, |
|
"eval_steps_per_second": 1.376, |
|
"step": 34 |
|
}, |
|
{ |
|
"epoch": 25.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2430939226519337, |
|
"eval_loss": 0.6432364583015442, |
|
"eval_roc_auc": 0.6407867494824016, |
|
"eval_runtime": 1.9386, |
|
"eval_samples_per_second": 21.665, |
|
"eval_steps_per_second": 1.547, |
|
"step": 35 |
|
}, |
|
{ |
|
"epoch": 26.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.24858757062146897, |
|
"eval_loss": 0.6401556730270386, |
|
"eval_roc_auc": 0.644927536231884, |
|
"eval_runtime": 1.9831, |
|
"eval_samples_per_second": 21.179, |
|
"eval_steps_per_second": 1.513, |
|
"step": 37 |
|
}, |
|
{ |
|
"epoch": 27.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.26857142857142857, |
|
"eval_loss": 0.6385589838027954, |
|
"eval_roc_auc": 0.666407867494824, |
|
"eval_runtime": 1.8248, |
|
"eval_samples_per_second": 23.016, |
|
"eval_steps_per_second": 1.644, |
|
"step": 38 |
|
}, |
|
{ |
|
"epoch": 28.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.27624309392265195, |
|
"eval_loss": 0.6375865936279297, |
|
"eval_roc_auc": 0.6796066252587992, |
|
"eval_runtime": 2.0365, |
|
"eval_samples_per_second": 20.624, |
|
"eval_steps_per_second": 1.473, |
|
"step": 39 |
|
}, |
|
{ |
|
"epoch": 29.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2692307692307692, |
|
"eval_loss": 0.6347113847732544, |
|
"eval_roc_auc": 0.6721014492753624, |
|
"eval_runtime": 2.0248, |
|
"eval_samples_per_second": 20.743, |
|
"eval_steps_per_second": 1.482, |
|
"step": 41 |
|
}, |
|
{ |
|
"epoch": 30.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.26553672316384186, |
|
"eval_loss": 0.6338767409324646, |
|
"eval_roc_auc": 0.6643374741200828, |
|
"eval_runtime": 1.912, |
|
"eval_samples_per_second": 21.966, |
|
"eval_steps_per_second": 1.569, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2674418604651163, |
|
"eval_loss": 0.6310274004936218, |
|
"eval_roc_auc": 0.6630434782608696, |
|
"eval_runtime": 2.048, |
|
"eval_samples_per_second": 20.508, |
|
"eval_steps_per_second": 1.465, |
|
"step": 44 |
|
}, |
|
{ |
|
"epoch": 32.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.27893175074183973, |
|
"eval_loss": 0.630736768245697, |
|
"eval_roc_auc": 0.6731366459627329, |
|
"eval_runtime": 1.9873, |
|
"eval_samples_per_second": 21.134, |
|
"eval_steps_per_second": 1.51, |
|
"step": 45 |
|
}, |
|
{ |
|
"epoch": 33.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2713864306784661, |
|
"eval_loss": 0.6290633678436279, |
|
"eval_roc_auc": 0.6656314699792961, |
|
"eval_runtime": 1.9917, |
|
"eval_samples_per_second": 21.087, |
|
"eval_steps_per_second": 1.506, |
|
"step": 46 |
|
}, |
|
{ |
|
"epoch": 34.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2760736196319018, |
|
"eval_loss": 0.6271013617515564, |
|
"eval_roc_auc": 0.6658902691511386, |
|
"eval_runtime": 1.9904, |
|
"eval_samples_per_second": 21.101, |
|
"eval_steps_per_second": 1.507, |
|
"step": 48 |
|
}, |
|
{ |
|
"epoch": 35.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2686567164179105, |
|
"eval_loss": 0.6270779371261597, |
|
"eval_roc_auc": 0.661231884057971, |
|
"eval_runtime": 2.05, |
|
"eval_samples_per_second": 20.488, |
|
"eval_steps_per_second": 1.463, |
|
"step": 49 |
|
}, |
|
{ |
|
"epoch": 36.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2606060606060606, |
|
"eval_loss": 0.6277384757995605, |
|
"eval_roc_auc": 0.650879917184265, |
|
"eval_runtime": 1.8738, |
|
"eval_samples_per_second": 22.415, |
|
"eval_steps_per_second": 1.601, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 37.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2741433021806854, |
|
"eval_loss": 0.6256951689720154, |
|
"eval_roc_auc": 0.6620082815734989, |
|
"eval_runtime": 2.0555, |
|
"eval_samples_per_second": 20.433, |
|
"eval_steps_per_second": 1.459, |
|
"step": 52 |
|
}, |
|
{ |
|
"epoch": 38.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.28923076923076924, |
|
"eval_loss": 0.624409556388855, |
|
"eval_roc_auc": 0.6793478260869565, |
|
"eval_runtime": 1.842, |
|
"eval_samples_per_second": 22.801, |
|
"eval_steps_per_second": 1.629, |
|
"step": 53 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.29677419354838713, |
|
"eval_loss": 0.6203488111495972, |
|
"eval_roc_auc": 0.6806418219461698, |
|
"eval_runtime": 1.9945, |
|
"eval_samples_per_second": 21.058, |
|
"eval_steps_per_second": 1.504, |
|
"step": 55 |
|
}, |
|
{ |
|
"epoch": 40.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2902208201892744, |
|
"eval_loss": 0.6198378801345825, |
|
"eval_roc_auc": 0.6770186335403728, |
|
"eval_runtime": 1.9168, |
|
"eval_samples_per_second": 21.912, |
|
"eval_steps_per_second": 1.565, |
|
"step": 56 |
|
}, |
|
{ |
|
"epoch": 41.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3022508038585209, |
|
"eval_loss": 0.6183561682701111, |
|
"eval_roc_auc": 0.6865942028985508, |
|
"eval_runtime": 2.0474, |
|
"eval_samples_per_second": 20.514, |
|
"eval_steps_per_second": 1.465, |
|
"step": 57 |
|
}, |
|
{ |
|
"epoch": 42.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2977346278317152, |
|
"eval_loss": 0.6163293719291687, |
|
"eval_roc_auc": 0.6811594202898551, |
|
"eval_runtime": 2.0211, |
|
"eval_samples_per_second": 20.781, |
|
"eval_steps_per_second": 1.484, |
|
"step": 59 |
|
}, |
|
{ |
|
"epoch": 43.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.33222591362126247, |
|
"eval_loss": 0.6147304177284241, |
|
"eval_roc_auc": 0.7111801242236025, |
|
"eval_runtime": 1.8612, |
|
"eval_samples_per_second": 22.566, |
|
"eval_steps_per_second": 1.612, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 44.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3197278911564626, |
|
"eval_loss": 0.6154341697692871, |
|
"eval_roc_auc": 0.6953933747412009, |
|
"eval_runtime": 2.1228, |
|
"eval_samples_per_second": 19.785, |
|
"eval_steps_per_second": 1.413, |
|
"step": 61 |
|
}, |
|
{ |
|
"epoch": 45.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.30163934426229505, |
|
"eval_loss": 0.6129170060157776, |
|
"eval_roc_auc": 0.6832298136645963, |
|
"eval_runtime": 1.8919, |
|
"eval_samples_per_second": 22.2, |
|
"eval_steps_per_second": 1.586, |
|
"step": 63 |
|
}, |
|
{ |
|
"epoch": 46.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.30201342281879195, |
|
"eval_loss": 0.6111928224563599, |
|
"eval_roc_auc": 0.680383022774327, |
|
"eval_runtime": 2.0579, |
|
"eval_samples_per_second": 20.409, |
|
"eval_steps_per_second": 1.458, |
|
"step": 64 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.29605263157894735, |
|
"eval_loss": 0.60954749584198, |
|
"eval_roc_auc": 0.6772774327122153, |
|
"eval_runtime": 2.0077, |
|
"eval_samples_per_second": 20.92, |
|
"eval_steps_per_second": 1.494, |
|
"step": 66 |
|
}, |
|
{ |
|
"epoch": 48.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.31333333333333335, |
|
"eval_loss": 0.6090860962867737, |
|
"eval_roc_auc": 0.692287784679089, |
|
"eval_runtime": 1.8446, |
|
"eval_samples_per_second": 22.769, |
|
"eval_steps_per_second": 1.626, |
|
"step": 67 |
|
}, |
|
{ |
|
"epoch": 49.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.32653061224489793, |
|
"eval_loss": 0.6089531183242798, |
|
"eval_roc_auc": 0.7018633540372671, |
|
"eval_runtime": 2.0701, |
|
"eval_samples_per_second": 20.289, |
|
"eval_steps_per_second": 1.449, |
|
"step": 68 |
|
}, |
|
{ |
|
"epoch": 50.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.30927835051546393, |
|
"eval_loss": 0.6077401638031006, |
|
"eval_roc_auc": 0.6840062111801242, |
|
"eval_runtime": 1.8396, |
|
"eval_samples_per_second": 22.832, |
|
"eval_steps_per_second": 1.631, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 51.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.32394366197183105, |
|
"eval_loss": 0.6065036654472351, |
|
"eval_roc_auc": 0.6940993788819875, |
|
"eval_runtime": 2.0429, |
|
"eval_samples_per_second": 20.559, |
|
"eval_steps_per_second": 1.469, |
|
"step": 71 |
|
}, |
|
{ |
|
"epoch": 52.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.32374100719424465, |
|
"eval_loss": 0.6057615876197815, |
|
"eval_roc_auc": 0.690734989648033, |
|
"eval_runtime": 1.8836, |
|
"eval_samples_per_second": 22.298, |
|
"eval_steps_per_second": 1.593, |
|
"step": 72 |
|
}, |
|
{ |
|
"epoch": 53.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3284671532846715, |
|
"eval_loss": 0.6027652621269226, |
|
"eval_roc_auc": 0.6928053830227744, |
|
"eval_runtime": 1.8924, |
|
"eval_samples_per_second": 22.194, |
|
"eval_steps_per_second": 1.585, |
|
"step": 74 |
|
}, |
|
{ |
|
"epoch": 54.55, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3284671532846715, |
|
"eval_loss": 0.6037685871124268, |
|
"eval_roc_auc": 0.6928053830227744, |
|
"eval_runtime": 1.8574, |
|
"eval_samples_per_second": 22.612, |
|
"eval_steps_per_second": 1.615, |
|
"step": 75 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.31970260223048325, |
|
"eval_loss": 0.6055669188499451, |
|
"eval_roc_auc": 0.6824534161490683, |
|
"eval_runtime": 2.0249, |
|
"eval_samples_per_second": 20.742, |
|
"eval_steps_per_second": 1.482, |
|
"step": 77 |
|
}, |
|
{ |
|
"epoch": 56.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3249097472924187, |
|
"eval_loss": 0.6073567867279053, |
|
"eval_roc_auc": 0.6912525879917184, |
|
"eval_runtime": 1.9844, |
|
"eval_samples_per_second": 21.165, |
|
"eval_steps_per_second": 1.512, |
|
"step": 78 |
|
}, |
|
{ |
|
"epoch": 57.45, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3157894736842105, |
|
"eval_loss": 0.6030458807945251, |
|
"eval_roc_auc": 0.677536231884058, |
|
"eval_runtime": 1.8981, |
|
"eval_samples_per_second": 22.127, |
|
"eval_steps_per_second": 1.581, |
|
"step": 79 |
|
}, |
|
{ |
|
"epoch": 58.91, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3358778625954198, |
|
"eval_loss": 0.6000563502311707, |
|
"eval_roc_auc": 0.6925465838509317, |
|
"eval_runtime": 2.137, |
|
"eval_samples_per_second": 19.653, |
|
"eval_steps_per_second": 1.404, |
|
"step": 81 |
|
}, |
|
{ |
|
"epoch": 59.64, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3409090909090909, |
|
"eval_loss": 0.5992631316184998, |
|
"eval_roc_auc": 0.6979813664596273, |
|
"eval_runtime": 1.8122, |
|
"eval_samples_per_second": 23.177, |
|
"eval_steps_per_second": 1.655, |
|
"step": 82 |
|
}, |
|
{ |
|
"epoch": 60.36, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.32592592592592595, |
|
"eval_loss": 0.6017413139343262, |
|
"eval_roc_auc": 0.6884057971014492, |
|
"eval_runtime": 2.0667, |
|
"eval_samples_per_second": 20.323, |
|
"eval_steps_per_second": 1.452, |
|
"step": 83 |
|
}, |
|
{ |
|
"epoch": 61.82, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3146067415730337, |
|
"eval_loss": 0.6009005308151245, |
|
"eval_roc_auc": 0.6770186335403726, |
|
"eval_runtime": 1.9156, |
|
"eval_samples_per_second": 21.925, |
|
"eval_steps_per_second": 1.566, |
|
"step": 85 |
|
}, |
|
{ |
|
"epoch": 62.55, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.31970260223048325, |
|
"eval_loss": 0.6017952561378479, |
|
"eval_roc_auc": 0.6824534161490683, |
|
"eval_runtime": 1.9734, |
|
"eval_samples_per_second": 21.283, |
|
"eval_steps_per_second": 1.52, |
|
"step": 86 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3129770992366412, |
|
"eval_loss": 0.5975026488304138, |
|
"eval_roc_auc": 0.6731366459627329, |
|
"eval_runtime": 1.9304, |
|
"eval_samples_per_second": 21.757, |
|
"eval_steps_per_second": 1.554, |
|
"step": 88 |
|
}, |
|
{ |
|
"epoch": 64.73, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3271375464684015, |
|
"eval_loss": 0.5978490710258484, |
|
"eval_roc_auc": 0.6889233954451346, |
|
"eval_runtime": 1.993, |
|
"eval_samples_per_second": 21.073, |
|
"eval_steps_per_second": 1.505, |
|
"step": 89 |
|
}, |
|
{ |
|
"epoch": 65.45, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.34241245136186765, |
|
"eval_loss": 0.5966595411300659, |
|
"eval_roc_auc": 0.6951345755693582, |
|
"eval_runtime": 1.8441, |
|
"eval_samples_per_second": 22.775, |
|
"eval_steps_per_second": 1.627, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 66.91, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3125, |
|
"eval_loss": 0.5973162055015564, |
|
"eval_roc_auc": 0.6697722567287785, |
|
"eval_runtime": 1.9347, |
|
"eval_samples_per_second": 21.708, |
|
"eval_steps_per_second": 1.551, |
|
"step": 92 |
|
}, |
|
{ |
|
"epoch": 67.64, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3371647509578544, |
|
"eval_loss": 0.5955641865730286, |
|
"eval_roc_auc": 0.693064182194617, |
|
"eval_runtime": 1.9179, |
|
"eval_samples_per_second": 21.899, |
|
"eval_steps_per_second": 1.564, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 68.36, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3372549019607843, |
|
"eval_loss": 0.5921858549118042, |
|
"eval_roc_auc": 0.6896997929606625, |
|
"eval_runtime": 1.9017, |
|
"eval_samples_per_second": 22.086, |
|
"eval_steps_per_second": 1.578, |
|
"step": 94 |
|
}, |
|
{ |
|
"epoch": 69.82, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.33201581027667987, |
|
"eval_loss": 0.5948788523674011, |
|
"eval_roc_auc": 0.6842650103519669, |
|
"eval_runtime": 1.8776, |
|
"eval_samples_per_second": 22.369, |
|
"eval_steps_per_second": 1.598, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 70.55, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.3412698412698413, |
|
"eval_loss": 0.5959014892578125, |
|
"eval_roc_auc": 0.6912525879917184, |
|
"eval_runtime": 2.0178, |
|
"eval_samples_per_second": 20.814, |
|
"eval_steps_per_second": 1.487, |
|
"step": 97 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3420074349442379, |
|
"eval_loss": 0.5944311022758484, |
|
"eval_roc_auc": 0.7018633540372671, |
|
"eval_runtime": 1.8838, |
|
"eval_samples_per_second": 22.295, |
|
"eval_steps_per_second": 1.593, |
|
"step": 99 |
|
}, |
|
{ |
|
"epoch": 72.73, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.3333333333333333, |
|
"eval_loss": 0.5955294370651245, |
|
"eval_roc_auc": 0.6881469979296065, |
|
"eval_runtime": 2.0716, |
|
"eval_samples_per_second": 20.275, |
|
"eval_steps_per_second": 1.448, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 73.45, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3346303501945525, |
|
"eval_loss": 0.5932918190956116, |
|
"eval_roc_auc": 0.6886645962732919, |
|
"eval_runtime": 1.9689, |
|
"eval_samples_per_second": 21.332, |
|
"eval_steps_per_second": 1.524, |
|
"step": 101 |
|
}, |
|
{ |
|
"epoch": 74.91, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3543307086614173, |
|
"eval_loss": 0.5894082188606262, |
|
"eval_roc_auc": 0.7031573498964803, |
|
"eval_runtime": 2.0135, |
|
"eval_samples_per_second": 20.859, |
|
"eval_steps_per_second": 1.49, |
|
"step": 103 |
|
}, |
|
{ |
|
"epoch": 75.64, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.34241245136186765, |
|
"eval_loss": 0.5903118848800659, |
|
"eval_roc_auc": 0.6951345755693582, |
|
"eval_runtime": 1.8434, |
|
"eval_samples_per_second": 22.784, |
|
"eval_steps_per_second": 1.627, |
|
"step": 104 |
|
}, |
|
{ |
|
"epoch": 76.36, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.3410852713178295, |
|
"eval_loss": 0.5889719128608704, |
|
"eval_roc_auc": 0.694616977225673, |
|
"eval_runtime": 2.0369, |
|
"eval_samples_per_second": 20.62, |
|
"eval_steps_per_second": 1.473, |
|
"step": 105 |
|
}, |
|
{ |
|
"epoch": 77.82, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.3346303501945525, |
|
"eval_loss": 0.5922066569328308, |
|
"eval_roc_auc": 0.6886645962732919, |
|
"eval_runtime": 1.8672, |
|
"eval_samples_per_second": 22.493, |
|
"eval_steps_per_second": 1.607, |
|
"step": 107 |
|
}, |
|
{ |
|
"epoch": 78.55, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.32432432432432434, |
|
"eval_loss": 0.5923347473144531, |
|
"eval_roc_auc": 0.6811594202898552, |
|
"eval_runtime": 2.0697, |
|
"eval_samples_per_second": 20.293, |
|
"eval_steps_per_second": 1.449, |
|
"step": 108 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.3467741935483871, |
|
"eval_loss": 0.590828537940979, |
|
"eval_roc_auc": 0.6933229813664595, |
|
"eval_runtime": 1.8922, |
|
"eval_samples_per_second": 22.196, |
|
"eval_steps_per_second": 1.585, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 80.73, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.328, |
|
"eval_loss": 0.5922424793243408, |
|
"eval_roc_auc": 0.6793478260869565, |
|
"eval_runtime": 2.0683, |
|
"eval_samples_per_second": 20.307, |
|
"eval_steps_per_second": 1.45, |
|
"step": 111 |
|
}, |
|
{ |
|
"epoch": 81.45, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.34400000000000003, |
|
"eval_loss": 0.5891572833061218, |
|
"eval_roc_auc": 0.692287784679089, |
|
"eval_runtime": 1.8345, |
|
"eval_samples_per_second": 22.894, |
|
"eval_steps_per_second": 1.635, |
|
"step": 112 |
|
}, |
|
{ |
|
"epoch": 82.91, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.35059760956175307, |
|
"eval_loss": 0.5879591703414917, |
|
"eval_roc_auc": 0.69824016563147, |
|
"eval_runtime": 1.9744, |
|
"eval_samples_per_second": 21.272, |
|
"eval_steps_per_second": 1.519, |
|
"step": 114 |
|
}, |
|
{ |
|
"epoch": 83.64, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.34538152610441764, |
|
"eval_loss": 0.5868695378303528, |
|
"eval_roc_auc": 0.6928053830227743, |
|
"eval_runtime": 1.943, |
|
"eval_samples_per_second": 21.616, |
|
"eval_steps_per_second": 1.544, |
|
"step": 115 |
|
}, |
|
{ |
|
"epoch": 84.36, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3464566929133858, |
|
"eval_loss": 0.5840514302253723, |
|
"eval_roc_auc": 0.6966873706004141, |
|
"eval_runtime": 2.0388, |
|
"eval_samples_per_second": 20.6, |
|
"eval_steps_per_second": 1.471, |
|
"step": 116 |
|
}, |
|
{ |
|
"epoch": 85.82, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.35684647302904565, |
|
"eval_loss": 0.5840616226196289, |
|
"eval_roc_auc": 0.6969461697722568, |
|
"eval_runtime": 1.9152, |
|
"eval_samples_per_second": 21.93, |
|
"eval_steps_per_second": 1.566, |
|
"step": 118 |
|
}, |
|
{ |
|
"epoch": 86.55, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.3495934959349593, |
|
"eval_loss": 0.5842622518539429, |
|
"eval_roc_auc": 0.6943581780538302, |
|
"eval_runtime": 2.0014, |
|
"eval_samples_per_second": 20.985, |
|
"eval_steps_per_second": 1.499, |
|
"step": 119 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.3598326359832636, |
|
"eval_loss": 0.5860231518745422, |
|
"eval_roc_auc": 0.6979813664596273, |
|
"eval_runtime": 1.7516, |
|
"eval_samples_per_second": 23.978, |
|
"eval_steps_per_second": 1.713, |
|
"step": 121 |
|
}, |
|
{ |
|
"epoch": 88.73, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.34567901234567905, |
|
"eval_loss": 0.5837295055389404, |
|
"eval_roc_auc": 0.6894409937888197, |
|
"eval_runtime": 2.0716, |
|
"eval_samples_per_second": 20.275, |
|
"eval_steps_per_second": 1.448, |
|
"step": 122 |
|
}, |
|
{ |
|
"epoch": 89.45, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3636363636363636, |
|
"eval_loss": 0.5826032161712646, |
|
"eval_roc_auc": 0.7028985507246376, |
|
"eval_runtime": 2.155, |
|
"eval_samples_per_second": 19.49, |
|
"eval_steps_per_second": 1.392, |
|
"step": 123 |
|
}, |
|
{ |
|
"epoch": 90.91, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3651452282157676, |
|
"eval_loss": 0.5821616053581238, |
|
"eval_roc_auc": 0.7034161490683231, |
|
"eval_runtime": 1.8665, |
|
"eval_samples_per_second": 22.502, |
|
"eval_steps_per_second": 1.607, |
|
"step": 125 |
|
}, |
|
{ |
|
"epoch": 91.64, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.36065573770491804, |
|
"eval_loss": 0.5813528299331665, |
|
"eval_roc_auc": 0.701863354037267, |
|
"eval_runtime": 2.0722, |
|
"eval_samples_per_second": 20.268, |
|
"eval_steps_per_second": 1.448, |
|
"step": 126 |
|
}, |
|
{ |
|
"epoch": 92.36, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.3629032258064516, |
|
"eval_loss": 0.5813586115837097, |
|
"eval_roc_auc": 0.7062629399585921, |
|
"eval_runtime": 1.8413, |
|
"eval_samples_per_second": 22.809, |
|
"eval_steps_per_second": 1.629, |
|
"step": 127 |
|
}, |
|
{ |
|
"epoch": 93.82, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.37130801687763715, |
|
"eval_loss": 0.5817737579345703, |
|
"eval_roc_auc": 0.7054865424430642, |
|
"eval_runtime": 2.0383, |
|
"eval_samples_per_second": 20.605, |
|
"eval_steps_per_second": 1.472, |
|
"step": 129 |
|
}, |
|
{ |
|
"epoch": 94.55, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3765690376569037, |
|
"eval_loss": 0.5802175402641296, |
|
"eval_roc_auc": 0.7109213250517598, |
|
"eval_runtime": 1.9338, |
|
"eval_samples_per_second": 21.718, |
|
"eval_steps_per_second": 1.551, |
|
"step": 130 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.36752136752136755, |
|
"eval_loss": 0.5802630186080933, |
|
"eval_roc_auc": 0.7005693581780539, |
|
"eval_runtime": 1.9997, |
|
"eval_samples_per_second": 21.003, |
|
"eval_steps_per_second": 1.5, |
|
"step": 132 |
|
}, |
|
{ |
|
"epoch": 96.73, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.351931330472103, |
|
"eval_loss": 0.5825139880180359, |
|
"eval_roc_auc": 0.6881469979296067, |
|
"eval_runtime": 2.0169, |
|
"eval_samples_per_second": 20.824, |
|
"eval_steps_per_second": 1.487, |
|
"step": 133 |
|
}, |
|
{ |
|
"epoch": 97.45, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3628691983122363, |
|
"eval_loss": 0.5789888501167297, |
|
"eval_roc_auc": 0.6990165631469979, |
|
"eval_runtime": 2.0766, |
|
"eval_samples_per_second": 20.225, |
|
"eval_steps_per_second": 1.445, |
|
"step": 134 |
|
}, |
|
{ |
|
"epoch": 98.91, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3765690376569037, |
|
"eval_loss": 0.5794755816459656, |
|
"eval_roc_auc": 0.7109213250517598, |
|
"eval_runtime": 1.8413, |
|
"eval_samples_per_second": 22.81, |
|
"eval_steps_per_second": 1.629, |
|
"step": 136 |
|
}, |
|
{ |
|
"epoch": 99.64, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3697478991596639, |
|
"eval_loss": 0.5784409642219543, |
|
"eval_roc_auc": 0.7049689440993788, |
|
"eval_runtime": 2.0156, |
|
"eval_samples_per_second": 20.837, |
|
"eval_steps_per_second": 1.488, |
|
"step": 137 |
|
}, |
|
{ |
|
"epoch": 100.36, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.35833333333333334, |
|
"eval_loss": 0.5818943977355957, |
|
"eval_roc_auc": 0.697463768115942, |
|
"eval_runtime": 1.8187, |
|
"eval_samples_per_second": 23.093, |
|
"eval_steps_per_second": 1.65, |
|
"step": 138 |
|
}, |
|
{ |
|
"epoch": 101.82, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.35245901639344257, |
|
"eval_loss": 0.5833745002746582, |
|
"eval_roc_auc": 0.6953933747412008, |
|
"eval_runtime": 2.073, |
|
"eval_samples_per_second": 20.261, |
|
"eval_steps_per_second": 1.447, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 102.55, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3688524590163934, |
|
"eval_loss": 0.5825251340866089, |
|
"eval_roc_auc": 0.7083333333333333, |
|
"eval_runtime": 1.9912, |
|
"eval_samples_per_second": 21.093, |
|
"eval_steps_per_second": 1.507, |
|
"step": 141 |
|
}, |
|
{ |
|
"epoch": 104.0, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3459915611814346, |
|
"eval_loss": 0.5839240550994873, |
|
"eval_roc_auc": 0.6860766045548654, |
|
"eval_runtime": 2.1002, |
|
"eval_samples_per_second": 19.998, |
|
"eval_steps_per_second": 1.428, |
|
"step": 143 |
|
}, |
|
{ |
|
"epoch": 104.73, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.3333333333333333, |
|
"eval_loss": 0.5838228464126587, |
|
"eval_roc_auc": 0.6814182194616977, |
|
"eval_runtime": 1.9156, |
|
"eval_samples_per_second": 21.926, |
|
"eval_steps_per_second": 1.566, |
|
"step": 144 |
|
}, |
|
{ |
|
"epoch": 105.45, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.33870967741935487, |
|
"eval_loss": 0.580091655254364, |
|
"eval_roc_auc": 0.6868530020703933, |
|
"eval_runtime": 2.1494, |
|
"eval_samples_per_second": 19.541, |
|
"eval_steps_per_second": 1.396, |
|
"step": 145 |
|
}, |
|
{ |
|
"epoch": 106.91, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.35146443514644354, |
|
"eval_loss": 0.581135630607605, |
|
"eval_roc_auc": 0.6915113871635612, |
|
"eval_runtime": 1.8396, |
|
"eval_samples_per_second": 22.831, |
|
"eval_steps_per_second": 1.631, |
|
"step": 147 |
|
}, |
|
{ |
|
"epoch": 107.64, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.3374485596707819, |
|
"eval_loss": 0.5792709589004517, |
|
"eval_roc_auc": 0.6829710144927537, |
|
"eval_runtime": 2.1328, |
|
"eval_samples_per_second": 19.693, |
|
"eval_steps_per_second": 1.407, |
|
"step": 148 |
|
}, |
|
{ |
|
"epoch": 108.36, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3448275862068966, |
|
"eval_loss": 0.5765911936759949, |
|
"eval_roc_auc": 0.6821946169772257, |
|
"eval_runtime": 2.0548, |
|
"eval_samples_per_second": 20.44, |
|
"eval_steps_per_second": 1.46, |
|
"step": 149 |
|
}, |
|
{ |
|
"epoch": 109.82, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.34453781512605036, |
|
"eval_loss": 0.5759981870651245, |
|
"eval_roc_auc": 0.6855590062111802, |
|
"eval_runtime": 2.1017, |
|
"eval_samples_per_second": 19.984, |
|
"eval_steps_per_second": 1.427, |
|
"step": 151 |
|
}, |
|
{ |
|
"epoch": 110.55, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3559322033898305, |
|
"eval_loss": 0.5757153034210205, |
|
"eval_roc_auc": 0.693064182194617, |
|
"eval_runtime": 1.8256, |
|
"eval_samples_per_second": 23.006, |
|
"eval_steps_per_second": 1.643, |
|
"step": 152 |
|
}, |
|
{ |
|
"epoch": 112.0, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3474576271186441, |
|
"eval_loss": 0.5759687423706055, |
|
"eval_roc_auc": 0.6865942028985509, |
|
"eval_runtime": 1.998, |
|
"eval_samples_per_second": 21.021, |
|
"eval_steps_per_second": 1.502, |
|
"step": 154 |
|
}, |
|
{ |
|
"epoch": 112.73, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3628691983122363, |
|
"eval_loss": 0.5742767453193665, |
|
"eval_roc_auc": 0.6990165631469979, |
|
"eval_runtime": 2.0687, |
|
"eval_samples_per_second": 20.303, |
|
"eval_steps_per_second": 1.45, |
|
"step": 155 |
|
}, |
|
{ |
|
"epoch": 113.45, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3636363636363636, |
|
"eval_loss": 0.5731971263885498, |
|
"eval_roc_auc": 0.7028985507246376, |
|
"eval_runtime": 1.9431, |
|
"eval_samples_per_second": 21.615, |
|
"eval_steps_per_second": 1.544, |
|
"step": 156 |
|
}, |
|
{ |
|
"epoch": 114.91, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.37860082304526754, |
|
"eval_loss": 0.5735821723937988, |
|
"eval_roc_auc": 0.7153209109730849, |
|
"eval_runtime": 2.067, |
|
"eval_samples_per_second": 20.32, |
|
"eval_steps_per_second": 1.451, |
|
"step": 158 |
|
}, |
|
{ |
|
"epoch": 115.64, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.36666666666666664, |
|
"eval_loss": 0.5763630867004395, |
|
"eval_roc_auc": 0.7039337474120083, |
|
"eval_runtime": 1.876, |
|
"eval_samples_per_second": 22.388, |
|
"eval_steps_per_second": 1.599, |
|
"step": 159 |
|
}, |
|
{ |
|
"epoch": 116.36, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.361344537815126, |
|
"eval_loss": 0.5764896273612976, |
|
"eval_roc_auc": 0.6984989648033126, |
|
"eval_runtime": 2.186, |
|
"eval_samples_per_second": 19.213, |
|
"eval_steps_per_second": 1.372, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 117.82, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.35744680851063826, |
|
"eval_loss": 0.5749201774597168, |
|
"eval_roc_auc": 0.6935817805383023, |
|
"eval_runtime": 1.8855, |
|
"eval_samples_per_second": 22.276, |
|
"eval_steps_per_second": 1.591, |
|
"step": 162 |
|
}, |
|
{ |
|
"epoch": 118.55, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.3591836734693878, |
|
"eval_loss": 0.5753706693649292, |
|
"eval_roc_auc": 0.7013457556935817, |
|
"eval_runtime": 2.0351, |
|
"eval_samples_per_second": 20.637, |
|
"eval_steps_per_second": 1.474, |
|
"step": 163 |
|
}, |
|
{ |
|
"epoch": 120.0, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.3665338645418327, |
|
"eval_loss": 0.5756567120552063, |
|
"eval_roc_auc": 0.7111801242236024, |
|
"eval_runtime": 1.777, |
|
"eval_samples_per_second": 23.636, |
|
"eval_steps_per_second": 1.688, |
|
"step": 165 |
|
}, |
|
{ |
|
"epoch": 120.73, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3728813559322034, |
|
"eval_loss": 0.5771237015724182, |
|
"eval_roc_auc": 0.7060041407867494, |
|
"eval_runtime": 2.0719, |
|
"eval_samples_per_second": 20.271, |
|
"eval_steps_per_second": 1.448, |
|
"step": 166 |
|
}, |
|
{ |
|
"epoch": 121.45, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3628691983122363, |
|
"eval_loss": 0.5745561122894287, |
|
"eval_roc_auc": 0.6990165631469979, |
|
"eval_runtime": 1.8367, |
|
"eval_samples_per_second": 22.867, |
|
"eval_steps_per_second": 1.633, |
|
"step": 167 |
|
}, |
|
{ |
|
"epoch": 122.91, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.36440677966101687, |
|
"eval_loss": 0.5757673382759094, |
|
"eval_roc_auc": 0.6995341614906831, |
|
"eval_runtime": 2.032, |
|
"eval_samples_per_second": 20.669, |
|
"eval_steps_per_second": 1.476, |
|
"step": 169 |
|
}, |
|
{ |
|
"epoch": 123.64, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3559322033898305, |
|
"eval_loss": 0.5745112299919128, |
|
"eval_roc_auc": 0.693064182194617, |
|
"eval_runtime": 1.8329, |
|
"eval_samples_per_second": 22.914, |
|
"eval_steps_per_second": 1.637, |
|
"step": 170 |
|
}, |
|
{ |
|
"epoch": 124.36, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.35443037974683544, |
|
"eval_loss": 0.5758460164070129, |
|
"eval_roc_auc": 0.6925465838509317, |
|
"eval_runtime": 2.0956, |
|
"eval_samples_per_second": 20.042, |
|
"eval_steps_per_second": 1.432, |
|
"step": 171 |
|
}, |
|
{ |
|
"epoch": 125.82, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3598326359832636, |
|
"eval_loss": 0.5759280323982239, |
|
"eval_roc_auc": 0.6979813664596273, |
|
"eval_runtime": 1.9931, |
|
"eval_samples_per_second": 21.072, |
|
"eval_steps_per_second": 1.505, |
|
"step": 173 |
|
}, |
|
{ |
|
"epoch": 126.55, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.35684647302904565, |
|
"eval_loss": 0.5771880149841309, |
|
"eval_roc_auc": 0.6969461697722568, |
|
"eval_runtime": 1.9762, |
|
"eval_samples_per_second": 21.253, |
|
"eval_steps_per_second": 1.518, |
|
"step": 174 |
|
}, |
|
{ |
|
"epoch": 128.0, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.35833333333333334, |
|
"eval_loss": 0.5747218132019043, |
|
"eval_roc_auc": 0.697463768115942, |
|
"eval_runtime": 2.0367, |
|
"eval_samples_per_second": 20.622, |
|
"eval_steps_per_second": 1.473, |
|
"step": 176 |
|
}, |
|
{ |
|
"epoch": 128.73, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.36440677966101687, |
|
"eval_loss": 0.5737968683242798, |
|
"eval_roc_auc": 0.6995341614906831, |
|
"eval_runtime": 1.802, |
|
"eval_samples_per_second": 23.307, |
|
"eval_steps_per_second": 1.665, |
|
"step": 177 |
|
}, |
|
{ |
|
"epoch": 129.45, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.36440677966101687, |
|
"eval_loss": 0.575109601020813, |
|
"eval_roc_auc": 0.6995341614906831, |
|
"eval_runtime": 2.0006, |
|
"eval_samples_per_second": 20.993, |
|
"eval_steps_per_second": 1.5, |
|
"step": 178 |
|
}, |
|
{ |
|
"epoch": 130.91, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.37130801687763715, |
|
"eval_loss": 0.5740981101989746, |
|
"eval_roc_auc": 0.7054865424430642, |
|
"eval_runtime": 1.7241, |
|
"eval_samples_per_second": 24.361, |
|
"eval_steps_per_second": 1.74, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 131.64, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.37130801687763715, |
|
"eval_loss": 0.5748480558395386, |
|
"eval_roc_auc": 0.7054865424430642, |
|
"eval_runtime": 2.2478, |
|
"eval_samples_per_second": 18.685, |
|
"eval_steps_per_second": 1.335, |
|
"step": 181 |
|
}, |
|
{ |
|
"epoch": 132.36, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3659574468085106, |
|
"eval_loss": 0.5767146944999695, |
|
"eval_roc_auc": 0.7000517598343685, |
|
"eval_runtime": 1.9197, |
|
"eval_samples_per_second": 21.879, |
|
"eval_steps_per_second": 1.563, |
|
"step": 182 |
|
}, |
|
{ |
|
"epoch": 133.82, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.3659574468085106, |
|
"eval_loss": 0.5731571316719055, |
|
"eval_roc_auc": 0.7000517598343685, |
|
"eval_runtime": 1.8071, |
|
"eval_samples_per_second": 23.241, |
|
"eval_steps_per_second": 1.66, |
|
"step": 184 |
|
}, |
|
{ |
|
"epoch": 134.55, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.3771929824561403, |
|
"eval_loss": 0.5742261409759521, |
|
"eval_roc_auc": 0.7036749482401656, |
|
"eval_runtime": 2.2015, |
|
"eval_samples_per_second": 19.078, |
|
"eval_steps_per_second": 1.363, |
|
"step": 185 |
|
}, |
|
{ |
|
"epoch": 136.0, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.37554585152838427, |
|
"eval_loss": 0.5690290927886963, |
|
"eval_roc_auc": 0.7031573498964804, |
|
"eval_runtime": 2.2207, |
|
"eval_samples_per_second": 18.913, |
|
"eval_steps_per_second": 1.351, |
|
"step": 187 |
|
}, |
|
{ |
|
"epoch": 136.73, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3805309734513274, |
|
"eval_loss": 0.5698773264884949, |
|
"eval_roc_auc": 0.7047101449275363, |
|
"eval_runtime": 2.491, |
|
"eval_samples_per_second": 16.861, |
|
"eval_steps_per_second": 1.204, |
|
"step": 188 |
|
}, |
|
{ |
|
"epoch": 137.45, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.37068965517241376, |
|
"eval_loss": 0.5743153095245361, |
|
"eval_roc_auc": 0.7016045548654244, |
|
"eval_runtime": 2.2065, |
|
"eval_samples_per_second": 19.034, |
|
"eval_steps_per_second": 1.36, |
|
"step": 189 |
|
}, |
|
{ |
|
"epoch": 138.91, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.3529411764705882, |
|
"eval_loss": 0.5739556550979614, |
|
"eval_roc_auc": 0.6920289855072465, |
|
"eval_runtime": 2.1255, |
|
"eval_samples_per_second": 19.76, |
|
"eval_steps_per_second": 1.411, |
|
"step": 191 |
|
}, |
|
{ |
|
"epoch": 139.64, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3659574468085106, |
|
"eval_loss": 0.5739744901657104, |
|
"eval_roc_auc": 0.7000517598343685, |
|
"eval_runtime": 2.0832, |
|
"eval_samples_per_second": 20.161, |
|
"eval_steps_per_second": 1.44, |
|
"step": 192 |
|
}, |
|
{ |
|
"epoch": 140.36, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.36440677966101687, |
|
"eval_loss": 0.5733990669250488, |
|
"eval_roc_auc": 0.6995341614906831, |
|
"eval_runtime": 2.021, |
|
"eval_samples_per_second": 20.782, |
|
"eval_steps_per_second": 1.484, |
|
"step": 193 |
|
}, |
|
{ |
|
"epoch": 141.82, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.36752136752136755, |
|
"eval_loss": 0.5739865303039551, |
|
"eval_roc_auc": 0.7005693581780539, |
|
"eval_runtime": 2.0466, |
|
"eval_samples_per_second": 20.522, |
|
"eval_steps_per_second": 1.466, |
|
"step": 195 |
|
}, |
|
{ |
|
"epoch": 142.55, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.37068965517241376, |
|
"eval_loss": 0.5721157789230347, |
|
"eval_roc_auc": 0.7016045548654244, |
|
"eval_runtime": 1.8265, |
|
"eval_samples_per_second": 22.994, |
|
"eval_steps_per_second": 1.642, |
|
"step": 196 |
|
}, |
|
{ |
|
"epoch": 144.0, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3766816143497758, |
|
"eval_loss": 0.5724892020225525, |
|
"eval_roc_auc": 0.6997929606625258, |
|
"eval_runtime": 2.0667, |
|
"eval_samples_per_second": 20.323, |
|
"eval_steps_per_second": 1.452, |
|
"step": 198 |
|
}, |
|
{ |
|
"epoch": 144.73, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.3728813559322034, |
|
"eval_loss": 0.5734347105026245, |
|
"eval_roc_auc": 0.7060041407867494, |
|
"eval_runtime": 1.798, |
|
"eval_samples_per_second": 23.359, |
|
"eval_steps_per_second": 1.669, |
|
"step": 199 |
|
}, |
|
{ |
|
"epoch": 145.45, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3628691983122363, |
|
"eval_loss": 0.575474202632904, |
|
"eval_roc_auc": 0.6990165631469979, |
|
"eval_runtime": 2.2459, |
|
"eval_samples_per_second": 18.701, |
|
"eval_steps_per_second": 1.336, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 145.45, |
|
"step": 200, |
|
"total_flos": 1.357171875053568e+17, |
|
"train_loss": 0.5662997841835022, |
|
"train_runtime": 1746.9239, |
|
"train_samples_per_second": 19.005, |
|
"train_steps_per_second": 0.114 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 200, |
|
"num_train_epochs": 200, |
|
"save_steps": 500, |
|
"total_flos": 1.357171875053568e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|