{ "best_metric": 0.3805309734513274, "best_model_checkpoint": "car_identified_model_7/checkpoint-188", "epoch": 145.45454545454547, "eval_steps": 500, "global_step": 200, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.73, "learning_rate": 1.9900000000000003e-05, "loss": 0.6919, "step": 1 }, { "epoch": 0.73, "eval_accuracy": 0.0, "eval_f1": 0.17857142857142858, "eval_loss": 0.6887282133102417, "eval_roc_auc": 0.5737577639751552, "eval_runtime": 2.8648, "eval_samples_per_second": 14.661, "eval_steps_per_second": 1.047, "step": 1 }, { "epoch": 1.45, "eval_accuracy": 0.0, "eval_f1": 0.1818181818181818, "eval_loss": 0.6855647563934326, "eval_roc_auc": 0.5760869565217391, "eval_runtime": 2.5822, "eval_samples_per_second": 16.265, "eval_steps_per_second": 1.162, "step": 2 }, { "epoch": 2.91, "eval_accuracy": 0.0, "eval_f1": 0.21164021164021166, "eval_loss": 0.6802406311035156, "eval_roc_auc": 0.6066252587991718, "eval_runtime": 2.1976, "eval_samples_per_second": 19.112, "eval_steps_per_second": 1.365, "step": 4 }, { "epoch": 3.64, "eval_accuracy": 0.0, "eval_f1": 0.18614718614718614, "eval_loss": 0.6800228953361511, "eval_roc_auc": 0.5825569358178053, "eval_runtime": 2.1512, "eval_samples_per_second": 19.524, "eval_steps_per_second": 1.395, "step": 5 }, { "epoch": 4.36, "eval_accuracy": 0.0, "eval_f1": 0.1904761904761905, "eval_loss": 0.6858328580856323, "eval_roc_auc": 0.5973084886128365, "eval_runtime": 1.8993, "eval_samples_per_second": 22.113, "eval_steps_per_second": 1.58, "step": 6 }, { "epoch": 5.82, "eval_accuracy": 0.0, "eval_f1": 0.15492957746478872, "eval_loss": 0.693770706653595, "eval_roc_auc": 0.5341614906832298, "eval_runtime": 1.986, "eval_samples_per_second": 21.148, "eval_steps_per_second": 1.511, "step": 8 }, { "epoch": 6.55, "eval_accuracy": 0.0, "eval_f1": 0.18050541516245489, "eval_loss": 0.6917278170585632, "eval_roc_auc": 0.5802277432712216, "eval_runtime": 1.8331, "eval_samples_per_second": 22.911, "eval_steps_per_second": 1.637, "step": 9 }, { "epoch": 8.0, "eval_accuracy": 0.0, "eval_f1": 0.19047619047619044, "eval_loss": 0.6735165119171143, "eval_roc_auc": 0.593167701863354, "eval_runtime": 2.0579, "eval_samples_per_second": 20.409, "eval_steps_per_second": 1.458, "step": 11 }, { "epoch": 8.73, "eval_accuracy": 0.0, "eval_f1": 0.1952191235059761, "eval_loss": 0.6727393865585327, "eval_roc_auc": 0.6006728778467909, "eval_runtime": 1.8528, "eval_samples_per_second": 22.669, "eval_steps_per_second": 1.619, "step": 12 }, { "epoch": 9.45, "eval_accuracy": 0.0, "eval_f1": 0.20606060606060606, "eval_loss": 0.6698008179664612, "eval_roc_auc": 0.6172360248447204, "eval_runtime": 2.0897, "eval_samples_per_second": 20.099, "eval_steps_per_second": 1.436, "step": 13 }, { "epoch": 10.91, "eval_accuracy": 0.0, "eval_f1": 0.20080321285140562, "eval_loss": 0.6671529412269592, "eval_roc_auc": 0.6092132505175983, "eval_runtime": 1.8899, "eval_samples_per_second": 22.224, "eval_steps_per_second": 1.587, "step": 15 }, { "epoch": 11.64, "eval_accuracy": 0.0, "eval_f1": 0.2092050209205021, "eval_loss": 0.6645169854164124, "eval_roc_auc": 0.6195652173913044, "eval_runtime": 1.9211, "eval_samples_per_second": 21.863, "eval_steps_per_second": 1.562, "step": 16 }, { "epoch": 12.36, "eval_accuracy": 0.0, "eval_f1": 0.20491803278688525, "eval_loss": 0.6645674705505371, "eval_roc_auc": 0.6143892339544513, "eval_runtime": 1.9806, "eval_samples_per_second": 21.206, "eval_steps_per_second": 1.515, "step": 17 }, { "epoch": 13.82, "eval_accuracy": 0.0, "eval_f1": 0.208067940552017, "eval_loss": 0.6622694134712219, "eval_roc_auc": 0.6167184265010353, "eval_runtime": 2.0813, "eval_samples_per_second": 20.179, "eval_steps_per_second": 1.441, "step": 19 }, { "epoch": 14.55, "eval_accuracy": 0.0, "eval_f1": 0.20779220779220778, "eval_loss": 0.6606575846672058, "eval_roc_auc": 0.6149068322981366, "eval_runtime": 1.8418, "eval_samples_per_second": 22.803, "eval_steps_per_second": 1.629, "step": 20 }, { "epoch": 16.0, "eval_accuracy": 0.0, "eval_f1": 0.22026431718061673, "eval_loss": 0.6584673523902893, "eval_roc_auc": 0.6319875776397516, "eval_runtime": 2.024, "eval_samples_per_second": 20.751, "eval_steps_per_second": 1.482, "step": 22 }, { "epoch": 16.73, "eval_accuracy": 0.0, "eval_f1": 0.21559633027522934, "eval_loss": 0.6561669111251831, "eval_roc_auc": 0.6218944099378882, "eval_runtime": 1.8303, "eval_samples_per_second": 22.947, "eval_steps_per_second": 1.639, "step": 23 }, { "epoch": 17.45, "eval_accuracy": 0.0, "eval_f1": 0.21818181818181817, "eval_loss": 0.6555350422859192, "eval_roc_auc": 0.6262939958592133, "eval_runtime": 1.9854, "eval_samples_per_second": 21.154, "eval_steps_per_second": 1.511, "step": 24 }, { "epoch": 18.91, "eval_accuracy": 0.0, "eval_f1": 0.2185273159144893, "eval_loss": 0.652241051197052, "eval_roc_auc": 0.6231884057971014, "eval_runtime": 1.9789, "eval_samples_per_second": 21.224, "eval_steps_per_second": 1.516, "step": 26 }, { "epoch": 19.64, "eval_accuracy": 0.0, "eval_f1": 0.22276029055690072, "eval_loss": 0.6512007713317871, "eval_roc_auc": 0.6273291925465838, "eval_runtime": 2.0333, "eval_samples_per_second": 20.656, "eval_steps_per_second": 1.475, "step": 27 }, { "epoch": 20.36, "eval_accuracy": 0.0, "eval_f1": 0.23558897243107768, "eval_loss": 0.6501262187957764, "eval_roc_auc": 0.6410455486542443, "eval_runtime": 2.1299, "eval_samples_per_second": 19.719, "eval_steps_per_second": 1.409, "step": 28 }, { "epoch": 21.82, "eval_accuracy": 0.0, "eval_f1": 0.22797927461139897, "eval_loss": 0.6477265357971191, "eval_roc_auc": 0.6283643892339545, "eval_runtime": 1.8983, "eval_samples_per_second": 22.125, "eval_steps_per_second": 1.58, "step": 30 }, { "epoch": 22.55, "eval_accuracy": 0.0, "eval_f1": 0.23255813953488372, "eval_loss": 0.6476041078567505, "eval_roc_auc": 0.6343167701863355, "eval_runtime": 2.1591, "eval_samples_per_second": 19.452, "eval_steps_per_second": 1.389, "step": 31 }, { "epoch": 24.0, "eval_accuracy": 0.0, "eval_f1": 0.24083769633507857, "eval_loss": 0.6469409465789795, "eval_roc_auc": 0.6433747412008282, "eval_runtime": 1.8477, "eval_samples_per_second": 22.731, "eval_steps_per_second": 1.624, "step": 33 }, { "epoch": 24.73, "eval_accuracy": 0.0, "eval_f1": 0.24089635854341737, "eval_loss": 0.6432453393936157, "eval_roc_auc": 0.6369047619047619, "eval_runtime": 2.1797, "eval_samples_per_second": 19.268, "eval_steps_per_second": 1.376, "step": 34 }, { "epoch": 25.45, "eval_accuracy": 0.0, "eval_f1": 0.2430939226519337, "eval_loss": 0.6432364583015442, "eval_roc_auc": 0.6407867494824016, "eval_runtime": 1.9386, "eval_samples_per_second": 21.665, "eval_steps_per_second": 1.547, "step": 35 }, { "epoch": 26.91, "eval_accuracy": 0.0, "eval_f1": 0.24858757062146897, "eval_loss": 0.6401556730270386, "eval_roc_auc": 0.644927536231884, "eval_runtime": 1.9831, "eval_samples_per_second": 21.179, "eval_steps_per_second": 1.513, "step": 37 }, { "epoch": 27.64, "eval_accuracy": 0.0, "eval_f1": 0.26857142857142857, "eval_loss": 0.6385589838027954, "eval_roc_auc": 0.666407867494824, "eval_runtime": 1.8248, "eval_samples_per_second": 23.016, "eval_steps_per_second": 1.644, "step": 38 }, { "epoch": 28.36, "eval_accuracy": 0.0, "eval_f1": 0.27624309392265195, "eval_loss": 0.6375865936279297, "eval_roc_auc": 0.6796066252587992, "eval_runtime": 2.0365, "eval_samples_per_second": 20.624, "eval_steps_per_second": 1.473, "step": 39 }, { "epoch": 29.82, "eval_accuracy": 0.0, "eval_f1": 0.2692307692307692, "eval_loss": 0.6347113847732544, "eval_roc_auc": 0.6721014492753624, "eval_runtime": 2.0248, "eval_samples_per_second": 20.743, "eval_steps_per_second": 1.482, "step": 41 }, { "epoch": 30.55, "eval_accuracy": 0.0, "eval_f1": 0.26553672316384186, "eval_loss": 0.6338767409324646, "eval_roc_auc": 0.6643374741200828, "eval_runtime": 1.912, "eval_samples_per_second": 21.966, "eval_steps_per_second": 1.569, "step": 42 }, { "epoch": 32.0, "eval_accuracy": 0.0, "eval_f1": 0.2674418604651163, "eval_loss": 0.6310274004936218, "eval_roc_auc": 0.6630434782608696, "eval_runtime": 2.048, "eval_samples_per_second": 20.508, "eval_steps_per_second": 1.465, "step": 44 }, { "epoch": 32.73, "eval_accuracy": 0.0, "eval_f1": 0.27893175074183973, "eval_loss": 0.630736768245697, "eval_roc_auc": 0.6731366459627329, "eval_runtime": 1.9873, "eval_samples_per_second": 21.134, "eval_steps_per_second": 1.51, "step": 45 }, { "epoch": 33.45, "eval_accuracy": 0.0, "eval_f1": 0.2713864306784661, "eval_loss": 0.6290633678436279, "eval_roc_auc": 0.6656314699792961, "eval_runtime": 1.9917, "eval_samples_per_second": 21.087, "eval_steps_per_second": 1.506, "step": 46 }, { "epoch": 34.91, "eval_accuracy": 0.0, "eval_f1": 0.2760736196319018, "eval_loss": 0.6271013617515564, "eval_roc_auc": 0.6658902691511386, "eval_runtime": 1.9904, "eval_samples_per_second": 21.101, "eval_steps_per_second": 1.507, "step": 48 }, { "epoch": 35.64, "eval_accuracy": 0.0, "eval_f1": 0.2686567164179105, "eval_loss": 0.6270779371261597, "eval_roc_auc": 0.661231884057971, "eval_runtime": 2.05, "eval_samples_per_second": 20.488, "eval_steps_per_second": 1.463, "step": 49 }, { "epoch": 36.36, "eval_accuracy": 0.0, "eval_f1": 0.2606060606060606, "eval_loss": 0.6277384757995605, "eval_roc_auc": 0.650879917184265, "eval_runtime": 1.8738, "eval_samples_per_second": 22.415, "eval_steps_per_second": 1.601, "step": 50 }, { "epoch": 37.82, "eval_accuracy": 0.0, "eval_f1": 0.2741433021806854, "eval_loss": 0.6256951689720154, "eval_roc_auc": 0.6620082815734989, "eval_runtime": 2.0555, "eval_samples_per_second": 20.433, "eval_steps_per_second": 1.459, "step": 52 }, { "epoch": 38.55, "eval_accuracy": 0.0, "eval_f1": 0.28923076923076924, "eval_loss": 0.624409556388855, "eval_roc_auc": 0.6793478260869565, "eval_runtime": 1.842, "eval_samples_per_second": 22.801, "eval_steps_per_second": 1.629, "step": 53 }, { "epoch": 40.0, "eval_accuracy": 0.0, "eval_f1": 0.29677419354838713, "eval_loss": 0.6203488111495972, "eval_roc_auc": 0.6806418219461698, "eval_runtime": 1.9945, "eval_samples_per_second": 21.058, "eval_steps_per_second": 1.504, "step": 55 }, { "epoch": 40.73, "eval_accuracy": 0.0, "eval_f1": 0.2902208201892744, "eval_loss": 0.6198378801345825, "eval_roc_auc": 0.6770186335403728, "eval_runtime": 1.9168, "eval_samples_per_second": 21.912, "eval_steps_per_second": 1.565, "step": 56 }, { "epoch": 41.45, "eval_accuracy": 0.0, "eval_f1": 0.3022508038585209, "eval_loss": 0.6183561682701111, "eval_roc_auc": 0.6865942028985508, "eval_runtime": 2.0474, "eval_samples_per_second": 20.514, "eval_steps_per_second": 1.465, "step": 57 }, { "epoch": 42.91, "eval_accuracy": 0.0, "eval_f1": 0.2977346278317152, "eval_loss": 0.6163293719291687, "eval_roc_auc": 0.6811594202898551, "eval_runtime": 2.0211, "eval_samples_per_second": 20.781, "eval_steps_per_second": 1.484, "step": 59 }, { "epoch": 43.64, "eval_accuracy": 0.0, "eval_f1": 0.33222591362126247, "eval_loss": 0.6147304177284241, "eval_roc_auc": 0.7111801242236025, "eval_runtime": 1.8612, "eval_samples_per_second": 22.566, "eval_steps_per_second": 1.612, "step": 60 }, { "epoch": 44.36, "eval_accuracy": 0.0, "eval_f1": 0.3197278911564626, "eval_loss": 0.6154341697692871, "eval_roc_auc": 0.6953933747412009, "eval_runtime": 2.1228, "eval_samples_per_second": 19.785, "eval_steps_per_second": 1.413, "step": 61 }, { "epoch": 45.82, "eval_accuracy": 0.0, "eval_f1": 0.30163934426229505, "eval_loss": 0.6129170060157776, "eval_roc_auc": 0.6832298136645963, "eval_runtime": 1.8919, "eval_samples_per_second": 22.2, "eval_steps_per_second": 1.586, "step": 63 }, { "epoch": 46.55, "eval_accuracy": 0.0, "eval_f1": 0.30201342281879195, "eval_loss": 0.6111928224563599, "eval_roc_auc": 0.680383022774327, "eval_runtime": 2.0579, "eval_samples_per_second": 20.409, "eval_steps_per_second": 1.458, "step": 64 }, { "epoch": 48.0, "eval_accuracy": 0.0, "eval_f1": 0.29605263157894735, "eval_loss": 0.60954749584198, "eval_roc_auc": 0.6772774327122153, "eval_runtime": 2.0077, "eval_samples_per_second": 20.92, "eval_steps_per_second": 1.494, "step": 66 }, { "epoch": 48.73, "eval_accuracy": 0.0, "eval_f1": 0.31333333333333335, "eval_loss": 0.6090860962867737, "eval_roc_auc": 0.692287784679089, "eval_runtime": 1.8446, "eval_samples_per_second": 22.769, "eval_steps_per_second": 1.626, "step": 67 }, { "epoch": 49.45, "eval_accuracy": 0.0, "eval_f1": 0.32653061224489793, "eval_loss": 0.6089531183242798, "eval_roc_auc": 0.7018633540372671, "eval_runtime": 2.0701, "eval_samples_per_second": 20.289, "eval_steps_per_second": 1.449, "step": 68 }, { "epoch": 50.91, "eval_accuracy": 0.0, "eval_f1": 0.30927835051546393, "eval_loss": 0.6077401638031006, "eval_roc_auc": 0.6840062111801242, "eval_runtime": 1.8396, "eval_samples_per_second": 22.832, "eval_steps_per_second": 1.631, "step": 70 }, { "epoch": 51.64, "eval_accuracy": 0.0, "eval_f1": 0.32394366197183105, "eval_loss": 0.6065036654472351, "eval_roc_auc": 0.6940993788819875, "eval_runtime": 2.0429, "eval_samples_per_second": 20.559, "eval_steps_per_second": 1.469, "step": 71 }, { "epoch": 52.36, "eval_accuracy": 0.0, "eval_f1": 0.32374100719424465, "eval_loss": 0.6057615876197815, "eval_roc_auc": 0.690734989648033, "eval_runtime": 1.8836, "eval_samples_per_second": 22.298, "eval_steps_per_second": 1.593, "step": 72 }, { "epoch": 53.82, "eval_accuracy": 0.0, "eval_f1": 0.3284671532846715, "eval_loss": 0.6027652621269226, "eval_roc_auc": 0.6928053830227744, "eval_runtime": 1.8924, "eval_samples_per_second": 22.194, "eval_steps_per_second": 1.585, "step": 74 }, { "epoch": 54.55, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.3284671532846715, "eval_loss": 0.6037685871124268, "eval_roc_auc": 0.6928053830227744, "eval_runtime": 1.8574, "eval_samples_per_second": 22.612, "eval_steps_per_second": 1.615, "step": 75 }, { "epoch": 56.0, "eval_accuracy": 0.0, "eval_f1": 0.31970260223048325, "eval_loss": 0.6055669188499451, "eval_roc_auc": 0.6824534161490683, "eval_runtime": 2.0249, "eval_samples_per_second": 20.742, "eval_steps_per_second": 1.482, "step": 77 }, { "epoch": 56.73, "eval_accuracy": 0.0, "eval_f1": 0.3249097472924187, "eval_loss": 0.6073567867279053, "eval_roc_auc": 0.6912525879917184, "eval_runtime": 1.9844, "eval_samples_per_second": 21.165, "eval_steps_per_second": 1.512, "step": 78 }, { "epoch": 57.45, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.3157894736842105, "eval_loss": 0.6030458807945251, "eval_roc_auc": 0.677536231884058, "eval_runtime": 1.8981, "eval_samples_per_second": 22.127, "eval_steps_per_second": 1.581, "step": 79 }, { "epoch": 58.91, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.3358778625954198, "eval_loss": 0.6000563502311707, "eval_roc_auc": 0.6925465838509317, "eval_runtime": 2.137, "eval_samples_per_second": 19.653, "eval_steps_per_second": 1.404, "step": 81 }, { "epoch": 59.64, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.3409090909090909, "eval_loss": 0.5992631316184998, "eval_roc_auc": 0.6979813664596273, "eval_runtime": 1.8122, "eval_samples_per_second": 23.177, "eval_steps_per_second": 1.655, "step": 82 }, { "epoch": 60.36, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.32592592592592595, "eval_loss": 0.6017413139343262, "eval_roc_auc": 0.6884057971014492, "eval_runtime": 2.0667, "eval_samples_per_second": 20.323, "eval_steps_per_second": 1.452, "step": 83 }, { "epoch": 61.82, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.3146067415730337, "eval_loss": 0.6009005308151245, "eval_roc_auc": 0.6770186335403726, "eval_runtime": 1.9156, "eval_samples_per_second": 21.925, "eval_steps_per_second": 1.566, "step": 85 }, { "epoch": 62.55, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.31970260223048325, "eval_loss": 0.6017952561378479, "eval_roc_auc": 0.6824534161490683, "eval_runtime": 1.9734, "eval_samples_per_second": 21.283, "eval_steps_per_second": 1.52, "step": 86 }, { "epoch": 64.0, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.3129770992366412, "eval_loss": 0.5975026488304138, "eval_roc_auc": 0.6731366459627329, "eval_runtime": 1.9304, "eval_samples_per_second": 21.757, "eval_steps_per_second": 1.554, "step": 88 }, { "epoch": 64.73, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.3271375464684015, "eval_loss": 0.5978490710258484, "eval_roc_auc": 0.6889233954451346, "eval_runtime": 1.993, "eval_samples_per_second": 21.073, "eval_steps_per_second": 1.505, "step": 89 }, { "epoch": 65.45, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.34241245136186765, "eval_loss": 0.5966595411300659, "eval_roc_auc": 0.6951345755693582, "eval_runtime": 1.8441, "eval_samples_per_second": 22.775, "eval_steps_per_second": 1.627, "step": 90 }, { "epoch": 66.91, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.3125, "eval_loss": 0.5973162055015564, "eval_roc_auc": 0.6697722567287785, "eval_runtime": 1.9347, "eval_samples_per_second": 21.708, "eval_steps_per_second": 1.551, "step": 92 }, { "epoch": 67.64, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.3371647509578544, "eval_loss": 0.5955641865730286, "eval_roc_auc": 0.693064182194617, "eval_runtime": 1.9179, "eval_samples_per_second": 21.899, "eval_steps_per_second": 1.564, "step": 93 }, { "epoch": 68.36, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.3372549019607843, "eval_loss": 0.5921858549118042, "eval_roc_auc": 0.6896997929606625, "eval_runtime": 1.9017, "eval_samples_per_second": 22.086, "eval_steps_per_second": 1.578, "step": 94 }, { "epoch": 69.82, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.33201581027667987, "eval_loss": 0.5948788523674011, "eval_roc_auc": 0.6842650103519669, "eval_runtime": 1.8776, "eval_samples_per_second": 22.369, "eval_steps_per_second": 1.598, "step": 96 }, { "epoch": 70.55, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.3412698412698413, "eval_loss": 0.5959014892578125, "eval_roc_auc": 0.6912525879917184, "eval_runtime": 2.0178, "eval_samples_per_second": 20.814, "eval_steps_per_second": 1.487, "step": 97 }, { "epoch": 72.0, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.3420074349442379, "eval_loss": 0.5944311022758484, "eval_roc_auc": 0.7018633540372671, "eval_runtime": 1.8838, "eval_samples_per_second": 22.295, "eval_steps_per_second": 1.593, "step": 99 }, { "epoch": 72.73, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.3333333333333333, "eval_loss": 0.5955294370651245, "eval_roc_auc": 0.6881469979296065, "eval_runtime": 2.0716, "eval_samples_per_second": 20.275, "eval_steps_per_second": 1.448, "step": 100 }, { "epoch": 73.45, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.3346303501945525, "eval_loss": 0.5932918190956116, "eval_roc_auc": 0.6886645962732919, "eval_runtime": 1.9689, "eval_samples_per_second": 21.332, "eval_steps_per_second": 1.524, "step": 101 }, { "epoch": 74.91, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.3543307086614173, "eval_loss": 0.5894082188606262, "eval_roc_auc": 0.7031573498964803, "eval_runtime": 2.0135, "eval_samples_per_second": 20.859, "eval_steps_per_second": 1.49, "step": 103 }, { "epoch": 75.64, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.34241245136186765, "eval_loss": 0.5903118848800659, "eval_roc_auc": 0.6951345755693582, "eval_runtime": 1.8434, "eval_samples_per_second": 22.784, "eval_steps_per_second": 1.627, "step": 104 }, { "epoch": 76.36, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.3410852713178295, "eval_loss": 0.5889719128608704, "eval_roc_auc": 0.694616977225673, "eval_runtime": 2.0369, "eval_samples_per_second": 20.62, "eval_steps_per_second": 1.473, "step": 105 }, { "epoch": 77.82, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.3346303501945525, "eval_loss": 0.5922066569328308, "eval_roc_auc": 0.6886645962732919, "eval_runtime": 1.8672, "eval_samples_per_second": 22.493, "eval_steps_per_second": 1.607, "step": 107 }, { "epoch": 78.55, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.32432432432432434, "eval_loss": 0.5923347473144531, "eval_roc_auc": 0.6811594202898552, "eval_runtime": 2.0697, "eval_samples_per_second": 20.293, "eval_steps_per_second": 1.449, "step": 108 }, { "epoch": 80.0, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.3467741935483871, "eval_loss": 0.590828537940979, "eval_roc_auc": 0.6933229813664595, "eval_runtime": 1.8922, "eval_samples_per_second": 22.196, "eval_steps_per_second": 1.585, "step": 110 }, { "epoch": 80.73, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.328, "eval_loss": 0.5922424793243408, "eval_roc_auc": 0.6793478260869565, "eval_runtime": 2.0683, "eval_samples_per_second": 20.307, "eval_steps_per_second": 1.45, "step": 111 }, { "epoch": 81.45, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.34400000000000003, "eval_loss": 0.5891572833061218, "eval_roc_auc": 0.692287784679089, "eval_runtime": 1.8345, "eval_samples_per_second": 22.894, "eval_steps_per_second": 1.635, "step": 112 }, { "epoch": 82.91, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.35059760956175307, "eval_loss": 0.5879591703414917, "eval_roc_auc": 0.69824016563147, "eval_runtime": 1.9744, "eval_samples_per_second": 21.272, "eval_steps_per_second": 1.519, "step": 114 }, { "epoch": 83.64, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.34538152610441764, "eval_loss": 0.5868695378303528, "eval_roc_auc": 0.6928053830227743, "eval_runtime": 1.943, "eval_samples_per_second": 21.616, "eval_steps_per_second": 1.544, "step": 115 }, { "epoch": 84.36, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.3464566929133858, "eval_loss": 0.5840514302253723, "eval_roc_auc": 0.6966873706004141, "eval_runtime": 2.0388, "eval_samples_per_second": 20.6, "eval_steps_per_second": 1.471, "step": 116 }, { "epoch": 85.82, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.35684647302904565, "eval_loss": 0.5840616226196289, "eval_roc_auc": 0.6969461697722568, "eval_runtime": 1.9152, "eval_samples_per_second": 21.93, "eval_steps_per_second": 1.566, "step": 118 }, { "epoch": 86.55, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.3495934959349593, "eval_loss": 0.5842622518539429, "eval_roc_auc": 0.6943581780538302, "eval_runtime": 2.0014, "eval_samples_per_second": 20.985, "eval_steps_per_second": 1.499, "step": 119 }, { "epoch": 88.0, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.3598326359832636, "eval_loss": 0.5860231518745422, "eval_roc_auc": 0.6979813664596273, "eval_runtime": 1.7516, "eval_samples_per_second": 23.978, "eval_steps_per_second": 1.713, "step": 121 }, { "epoch": 88.73, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.34567901234567905, "eval_loss": 0.5837295055389404, "eval_roc_auc": 0.6894409937888197, "eval_runtime": 2.0716, "eval_samples_per_second": 20.275, "eval_steps_per_second": 1.448, "step": 122 }, { "epoch": 89.45, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3636363636363636, "eval_loss": 0.5826032161712646, "eval_roc_auc": 0.7028985507246376, "eval_runtime": 2.155, "eval_samples_per_second": 19.49, "eval_steps_per_second": 1.392, "step": 123 }, { "epoch": 90.91, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3651452282157676, "eval_loss": 0.5821616053581238, "eval_roc_auc": 0.7034161490683231, "eval_runtime": 1.8665, "eval_samples_per_second": 22.502, "eval_steps_per_second": 1.607, "step": 125 }, { "epoch": 91.64, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.36065573770491804, "eval_loss": 0.5813528299331665, "eval_roc_auc": 0.701863354037267, "eval_runtime": 2.0722, "eval_samples_per_second": 20.268, "eval_steps_per_second": 1.448, "step": 126 }, { "epoch": 92.36, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.3629032258064516, "eval_loss": 0.5813586115837097, "eval_roc_auc": 0.7062629399585921, "eval_runtime": 1.8413, "eval_samples_per_second": 22.809, "eval_steps_per_second": 1.629, "step": 127 }, { "epoch": 93.82, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.37130801687763715, "eval_loss": 0.5817737579345703, "eval_roc_auc": 0.7054865424430642, "eval_runtime": 2.0383, "eval_samples_per_second": 20.605, "eval_steps_per_second": 1.472, "step": 129 }, { "epoch": 94.55, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3765690376569037, "eval_loss": 0.5802175402641296, "eval_roc_auc": 0.7109213250517598, "eval_runtime": 1.9338, "eval_samples_per_second": 21.718, "eval_steps_per_second": 1.551, "step": 130 }, { "epoch": 96.0, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.36752136752136755, "eval_loss": 0.5802630186080933, "eval_roc_auc": 0.7005693581780539, "eval_runtime": 1.9997, "eval_samples_per_second": 21.003, "eval_steps_per_second": 1.5, "step": 132 }, { "epoch": 96.73, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.351931330472103, "eval_loss": 0.5825139880180359, "eval_roc_auc": 0.6881469979296067, "eval_runtime": 2.0169, "eval_samples_per_second": 20.824, "eval_steps_per_second": 1.487, "step": 133 }, { "epoch": 97.45, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3628691983122363, "eval_loss": 0.5789888501167297, "eval_roc_auc": 0.6990165631469979, "eval_runtime": 2.0766, "eval_samples_per_second": 20.225, "eval_steps_per_second": 1.445, "step": 134 }, { "epoch": 98.91, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3765690376569037, "eval_loss": 0.5794755816459656, "eval_roc_auc": 0.7109213250517598, "eval_runtime": 1.8413, "eval_samples_per_second": 22.81, "eval_steps_per_second": 1.629, "step": 136 }, { "epoch": 99.64, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3697478991596639, "eval_loss": 0.5784409642219543, "eval_roc_auc": 0.7049689440993788, "eval_runtime": 2.0156, "eval_samples_per_second": 20.837, "eval_steps_per_second": 1.488, "step": 137 }, { "epoch": 100.36, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.35833333333333334, "eval_loss": 0.5818943977355957, "eval_roc_auc": 0.697463768115942, "eval_runtime": 1.8187, "eval_samples_per_second": 23.093, "eval_steps_per_second": 1.65, "step": 138 }, { "epoch": 101.82, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.35245901639344257, "eval_loss": 0.5833745002746582, "eval_roc_auc": 0.6953933747412008, "eval_runtime": 2.073, "eval_samples_per_second": 20.261, "eval_steps_per_second": 1.447, "step": 140 }, { "epoch": 102.55, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.3688524590163934, "eval_loss": 0.5825251340866089, "eval_roc_auc": 0.7083333333333333, "eval_runtime": 1.9912, "eval_samples_per_second": 21.093, "eval_steps_per_second": 1.507, "step": 141 }, { "epoch": 104.0, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3459915611814346, "eval_loss": 0.5839240550994873, "eval_roc_auc": 0.6860766045548654, "eval_runtime": 2.1002, "eval_samples_per_second": 19.998, "eval_steps_per_second": 1.428, "step": 143 }, { "epoch": 104.73, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.3333333333333333, "eval_loss": 0.5838228464126587, "eval_roc_auc": 0.6814182194616977, "eval_runtime": 1.9156, "eval_samples_per_second": 21.926, "eval_steps_per_second": 1.566, "step": 144 }, { "epoch": 105.45, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.33870967741935487, "eval_loss": 0.580091655254364, "eval_roc_auc": 0.6868530020703933, "eval_runtime": 2.1494, "eval_samples_per_second": 19.541, "eval_steps_per_second": 1.396, "step": 145 }, { "epoch": 106.91, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.35146443514644354, "eval_loss": 0.581135630607605, "eval_roc_auc": 0.6915113871635612, "eval_runtime": 1.8396, "eval_samples_per_second": 22.831, "eval_steps_per_second": 1.631, "step": 147 }, { "epoch": 107.64, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.3374485596707819, "eval_loss": 0.5792709589004517, "eval_roc_auc": 0.6829710144927537, "eval_runtime": 2.1328, "eval_samples_per_second": 19.693, "eval_steps_per_second": 1.407, "step": 148 }, { "epoch": 108.36, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3448275862068966, "eval_loss": 0.5765911936759949, "eval_roc_auc": 0.6821946169772257, "eval_runtime": 2.0548, "eval_samples_per_second": 20.44, "eval_steps_per_second": 1.46, "step": 149 }, { "epoch": 109.82, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.34453781512605036, "eval_loss": 0.5759981870651245, "eval_roc_auc": 0.6855590062111802, "eval_runtime": 2.1017, "eval_samples_per_second": 19.984, "eval_steps_per_second": 1.427, "step": 151 }, { "epoch": 110.55, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3559322033898305, "eval_loss": 0.5757153034210205, "eval_roc_auc": 0.693064182194617, "eval_runtime": 1.8256, "eval_samples_per_second": 23.006, "eval_steps_per_second": 1.643, "step": 152 }, { "epoch": 112.0, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3474576271186441, "eval_loss": 0.5759687423706055, "eval_roc_auc": 0.6865942028985509, "eval_runtime": 1.998, "eval_samples_per_second": 21.021, "eval_steps_per_second": 1.502, "step": 154 }, { "epoch": 112.73, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3628691983122363, "eval_loss": 0.5742767453193665, "eval_roc_auc": 0.6990165631469979, "eval_runtime": 2.0687, "eval_samples_per_second": 20.303, "eval_steps_per_second": 1.45, "step": 155 }, { "epoch": 113.45, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3636363636363636, "eval_loss": 0.5731971263885498, "eval_roc_auc": 0.7028985507246376, "eval_runtime": 1.9431, "eval_samples_per_second": 21.615, "eval_steps_per_second": 1.544, "step": 156 }, { "epoch": 114.91, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.37860082304526754, "eval_loss": 0.5735821723937988, "eval_roc_auc": 0.7153209109730849, "eval_runtime": 2.067, "eval_samples_per_second": 20.32, "eval_steps_per_second": 1.451, "step": 158 }, { "epoch": 115.64, "eval_accuracy": 0.023809523809523808, "eval_f1": 0.36666666666666664, "eval_loss": 0.5763630867004395, "eval_roc_auc": 0.7039337474120083, "eval_runtime": 1.876, "eval_samples_per_second": 22.388, "eval_steps_per_second": 1.599, "step": 159 }, { "epoch": 116.36, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.361344537815126, "eval_loss": 0.5764896273612976, "eval_roc_auc": 0.6984989648033126, "eval_runtime": 2.186, "eval_samples_per_second": 19.213, "eval_steps_per_second": 1.372, "step": 160 }, { "epoch": 117.82, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.35744680851063826, "eval_loss": 0.5749201774597168, "eval_roc_auc": 0.6935817805383023, "eval_runtime": 1.8855, "eval_samples_per_second": 22.276, "eval_steps_per_second": 1.591, "step": 162 }, { "epoch": 118.55, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.3591836734693878, "eval_loss": 0.5753706693649292, "eval_roc_auc": 0.7013457556935817, "eval_runtime": 2.0351, "eval_samples_per_second": 20.637, "eval_steps_per_second": 1.474, "step": 163 }, { "epoch": 120.0, "eval_accuracy": 0.047619047619047616, "eval_f1": 0.3665338645418327, "eval_loss": 0.5756567120552063, "eval_roc_auc": 0.7111801242236024, "eval_runtime": 1.777, "eval_samples_per_second": 23.636, "eval_steps_per_second": 1.688, "step": 165 }, { "epoch": 120.73, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3728813559322034, "eval_loss": 0.5771237015724182, "eval_roc_auc": 0.7060041407867494, "eval_runtime": 2.0719, "eval_samples_per_second": 20.271, "eval_steps_per_second": 1.448, "step": 166 }, { "epoch": 121.45, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3628691983122363, "eval_loss": 0.5745561122894287, "eval_roc_auc": 0.6990165631469979, "eval_runtime": 1.8367, "eval_samples_per_second": 22.867, "eval_steps_per_second": 1.633, "step": 167 }, { "epoch": 122.91, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.36440677966101687, "eval_loss": 0.5757673382759094, "eval_roc_auc": 0.6995341614906831, "eval_runtime": 2.032, "eval_samples_per_second": 20.669, "eval_steps_per_second": 1.476, "step": 169 }, { "epoch": 123.64, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3559322033898305, "eval_loss": 0.5745112299919128, "eval_roc_auc": 0.693064182194617, "eval_runtime": 1.8329, "eval_samples_per_second": 22.914, "eval_steps_per_second": 1.637, "step": 170 }, { "epoch": 124.36, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.35443037974683544, "eval_loss": 0.5758460164070129, "eval_roc_auc": 0.6925465838509317, "eval_runtime": 2.0956, "eval_samples_per_second": 20.042, "eval_steps_per_second": 1.432, "step": 171 }, { "epoch": 125.82, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3598326359832636, "eval_loss": 0.5759280323982239, "eval_roc_auc": 0.6979813664596273, "eval_runtime": 1.9931, "eval_samples_per_second": 21.072, "eval_steps_per_second": 1.505, "step": 173 }, { "epoch": 126.55, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.35684647302904565, "eval_loss": 0.5771880149841309, "eval_roc_auc": 0.6969461697722568, "eval_runtime": 1.9762, "eval_samples_per_second": 21.253, "eval_steps_per_second": 1.518, "step": 174 }, { "epoch": 128.0, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.35833333333333334, "eval_loss": 0.5747218132019043, "eval_roc_auc": 0.697463768115942, "eval_runtime": 2.0367, "eval_samples_per_second": 20.622, "eval_steps_per_second": 1.473, "step": 176 }, { "epoch": 128.73, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.36440677966101687, "eval_loss": 0.5737968683242798, "eval_roc_auc": 0.6995341614906831, "eval_runtime": 1.802, "eval_samples_per_second": 23.307, "eval_steps_per_second": 1.665, "step": 177 }, { "epoch": 129.45, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.36440677966101687, "eval_loss": 0.575109601020813, "eval_roc_auc": 0.6995341614906831, "eval_runtime": 2.0006, "eval_samples_per_second": 20.993, "eval_steps_per_second": 1.5, "step": 178 }, { "epoch": 130.91, "eval_accuracy": 0.09523809523809523, "eval_f1": 0.37130801687763715, "eval_loss": 0.5740981101989746, "eval_roc_auc": 0.7054865424430642, "eval_runtime": 1.7241, "eval_samples_per_second": 24.361, "eval_steps_per_second": 1.74, "step": 180 }, { "epoch": 131.64, "eval_accuracy": 0.09523809523809523, "eval_f1": 0.37130801687763715, "eval_loss": 0.5748480558395386, "eval_roc_auc": 0.7054865424430642, "eval_runtime": 2.2478, "eval_samples_per_second": 18.685, "eval_steps_per_second": 1.335, "step": 181 }, { "epoch": 132.36, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3659574468085106, "eval_loss": 0.5767146944999695, "eval_roc_auc": 0.7000517598343685, "eval_runtime": 1.9197, "eval_samples_per_second": 21.879, "eval_steps_per_second": 1.563, "step": 182 }, { "epoch": 133.82, "eval_accuracy": 0.09523809523809523, "eval_f1": 0.3659574468085106, "eval_loss": 0.5731571316719055, "eval_roc_auc": 0.7000517598343685, "eval_runtime": 1.8071, "eval_samples_per_second": 23.241, "eval_steps_per_second": 1.66, "step": 184 }, { "epoch": 134.55, "eval_accuracy": 0.09523809523809523, "eval_f1": 0.3771929824561403, "eval_loss": 0.5742261409759521, "eval_roc_auc": 0.7036749482401656, "eval_runtime": 2.2015, "eval_samples_per_second": 19.078, "eval_steps_per_second": 1.363, "step": 185 }, { "epoch": 136.0, "eval_accuracy": 0.09523809523809523, "eval_f1": 0.37554585152838427, "eval_loss": 0.5690290927886963, "eval_roc_auc": 0.7031573498964804, "eval_runtime": 2.2207, "eval_samples_per_second": 18.913, "eval_steps_per_second": 1.351, "step": 187 }, { "epoch": 136.73, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3805309734513274, "eval_loss": 0.5698773264884949, "eval_roc_auc": 0.7047101449275363, "eval_runtime": 2.491, "eval_samples_per_second": 16.861, "eval_steps_per_second": 1.204, "step": 188 }, { "epoch": 137.45, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.37068965517241376, "eval_loss": 0.5743153095245361, "eval_roc_auc": 0.7016045548654244, "eval_runtime": 2.2065, "eval_samples_per_second": 19.034, "eval_steps_per_second": 1.36, "step": 189 }, { "epoch": 138.91, "eval_accuracy": 0.09523809523809523, "eval_f1": 0.3529411764705882, "eval_loss": 0.5739556550979614, "eval_roc_auc": 0.6920289855072465, "eval_runtime": 2.1255, "eval_samples_per_second": 19.76, "eval_steps_per_second": 1.411, "step": 191 }, { "epoch": 139.64, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3659574468085106, "eval_loss": 0.5739744901657104, "eval_roc_auc": 0.7000517598343685, "eval_runtime": 2.0832, "eval_samples_per_second": 20.161, "eval_steps_per_second": 1.44, "step": 192 }, { "epoch": 140.36, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.36440677966101687, "eval_loss": 0.5733990669250488, "eval_roc_auc": 0.6995341614906831, "eval_runtime": 2.021, "eval_samples_per_second": 20.782, "eval_steps_per_second": 1.484, "step": 193 }, { "epoch": 141.82, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.36752136752136755, "eval_loss": 0.5739865303039551, "eval_roc_auc": 0.7005693581780539, "eval_runtime": 2.0466, "eval_samples_per_second": 20.522, "eval_steps_per_second": 1.466, "step": 195 }, { "epoch": 142.55, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.37068965517241376, "eval_loss": 0.5721157789230347, "eval_roc_auc": 0.7016045548654244, "eval_runtime": 1.8265, "eval_samples_per_second": 22.994, "eval_steps_per_second": 1.642, "step": 196 }, { "epoch": 144.0, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3766816143497758, "eval_loss": 0.5724892020225525, "eval_roc_auc": 0.6997929606625258, "eval_runtime": 2.0667, "eval_samples_per_second": 20.323, "eval_steps_per_second": 1.452, "step": 198 }, { "epoch": 144.73, "eval_accuracy": 0.09523809523809523, "eval_f1": 0.3728813559322034, "eval_loss": 0.5734347105026245, "eval_roc_auc": 0.7060041407867494, "eval_runtime": 1.798, "eval_samples_per_second": 23.359, "eval_steps_per_second": 1.669, "step": 199 }, { "epoch": 145.45, "eval_accuracy": 0.07142857142857142, "eval_f1": 0.3628691983122363, "eval_loss": 0.575474202632904, "eval_roc_auc": 0.6990165631469979, "eval_runtime": 2.2459, "eval_samples_per_second": 18.701, "eval_steps_per_second": 1.336, "step": 200 }, { "epoch": 145.45, "step": 200, "total_flos": 1.357171875053568e+17, "train_loss": 0.5662997841835022, "train_runtime": 1746.9239, "train_samples_per_second": 19.005, "train_steps_per_second": 0.114 } ], "logging_steps": 500, "max_steps": 200, "num_train_epochs": 200, "save_steps": 500, "total_flos": 1.357171875053568e+17, "trial_name": null, "trial_params": null }