|
{ |
|
"best_metric": 0.9491525423728814, |
|
"best_model_checkpoint": "beit-base-patch16-224/checkpoint-51", |
|
"epoch": 42.35294117647059, |
|
"eval_steps": 500, |
|
"global_step": 180, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.9411764705882353, |
|
"eval_accuracy": 0.864406779661017, |
|
"eval_f1_score": 0.8151914626490897, |
|
"eval_loss": 0.35985592007637024, |
|
"eval_precision": 0.8831092928112214, |
|
"eval_recall": 0.864406779661017, |
|
"eval_runtime": 0.994, |
|
"eval_samples_per_second": 59.356, |
|
"eval_steps_per_second": 2.012, |
|
"step": 4 |
|
}, |
|
{ |
|
"epoch": 1.8823529411764706, |
|
"eval_accuracy": 0.8983050847457628, |
|
"eval_f1_score": 0.8983050847457628, |
|
"eval_loss": 0.2752338945865631, |
|
"eval_precision": 0.8983050847457628, |
|
"eval_recall": 0.8983050847457628, |
|
"eval_runtime": 1.1891, |
|
"eval_samples_per_second": 49.617, |
|
"eval_steps_per_second": 1.682, |
|
"step": 8 |
|
}, |
|
{ |
|
"epoch": 2.8235294117647056, |
|
"eval_accuracy": 0.9322033898305084, |
|
"eval_f1_score": 0.9286307743436357, |
|
"eval_loss": 0.17347723245620728, |
|
"eval_precision": 0.9293164462655988, |
|
"eval_recall": 0.9322033898305084, |
|
"eval_runtime": 1.0218, |
|
"eval_samples_per_second": 57.739, |
|
"eval_steps_per_second": 1.957, |
|
"step": 12 |
|
}, |
|
{ |
|
"epoch": 3.5294117647058822, |
|
"grad_norm": 5.715649604797363, |
|
"learning_rate": 4.166666666666667e-05, |
|
"loss": 0.2978, |
|
"step": 15 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.9199970045680336, |
|
"eval_loss": 0.17451411485671997, |
|
"eval_precision": 0.9311215290299315, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.228, |
|
"eval_samples_per_second": 48.047, |
|
"eval_steps_per_second": 1.629, |
|
"step": 17 |
|
}, |
|
{ |
|
"epoch": 4.9411764705882355, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.9170563800358625, |
|
"eval_loss": 0.1887725591659546, |
|
"eval_precision": 0.9196471809062606, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.0748, |
|
"eval_samples_per_second": 54.895, |
|
"eval_steps_per_second": 1.861, |
|
"step": 21 |
|
}, |
|
{ |
|
"epoch": 5.882352941176471, |
|
"eval_accuracy": 0.8983050847457628, |
|
"eval_f1_score": 0.9023521272915945, |
|
"eval_loss": 0.2818872034549713, |
|
"eval_precision": 0.9092193117616847, |
|
"eval_recall": 0.8983050847457628, |
|
"eval_runtime": 1.2817, |
|
"eval_samples_per_second": 46.032, |
|
"eval_steps_per_second": 1.56, |
|
"step": 25 |
|
}, |
|
{ |
|
"epoch": 6.823529411764706, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.900974731483206, |
|
"eval_loss": 0.5331762433052063, |
|
"eval_precision": 0.9229583975346687, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.1367, |
|
"eval_samples_per_second": 51.907, |
|
"eval_steps_per_second": 1.76, |
|
"step": 29 |
|
}, |
|
{ |
|
"epoch": 7.0588235294117645, |
|
"grad_norm": 3.518982410430908, |
|
"learning_rate": 4.62962962962963e-05, |
|
"loss": 0.0283, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.9199970045680336, |
|
"eval_loss": 0.5418176054954529, |
|
"eval_precision": 0.9311215290299315, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.0994, |
|
"eval_samples_per_second": 53.664, |
|
"eval_steps_per_second": 1.819, |
|
"step": 34 |
|
}, |
|
{ |
|
"epoch": 8.941176470588236, |
|
"eval_accuracy": 0.8983050847457628, |
|
"eval_f1_score": 0.8757595139110971, |
|
"eval_loss": 0.6493940353393555, |
|
"eval_precision": 0.9092009685230025, |
|
"eval_recall": 0.8983050847457628, |
|
"eval_runtime": 1.1076, |
|
"eval_samples_per_second": 53.266, |
|
"eval_steps_per_second": 1.806, |
|
"step": 38 |
|
}, |
|
{ |
|
"epoch": 9.882352941176471, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.9222355815847652, |
|
"eval_loss": 0.5614629983901978, |
|
"eval_precision": 0.9455205811138014, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.107, |
|
"eval_samples_per_second": 53.298, |
|
"eval_steps_per_second": 1.807, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 10.588235294117647, |
|
"grad_norm": 0.022936690598726273, |
|
"learning_rate": 4.166666666666667e-05, |
|
"loss": 0.0061, |
|
"step": 45 |
|
}, |
|
{ |
|
"epoch": 10.823529411764707, |
|
"eval_accuracy": 0.8983050847457628, |
|
"eval_f1_score": 0.8857329111566401, |
|
"eval_loss": 0.8766900897026062, |
|
"eval_precision": 0.8910232266164471, |
|
"eval_recall": 0.8983050847457628, |
|
"eval_runtime": 1.0968, |
|
"eval_samples_per_second": 53.791, |
|
"eval_steps_per_second": 1.823, |
|
"step": 46 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.9491525423728814, |
|
"eval_f1_score": 0.9519982027408203, |
|
"eval_loss": 0.3859255313873291, |
|
"eval_precision": 0.961864406779661, |
|
"eval_recall": 0.9491525423728814, |
|
"eval_runtime": 1.1019, |
|
"eval_samples_per_second": 53.546, |
|
"eval_steps_per_second": 1.815, |
|
"step": 51 |
|
}, |
|
{ |
|
"epoch": 12.941176470588236, |
|
"eval_accuracy": 0.9322033898305084, |
|
"eval_f1_score": 0.9322033898305084, |
|
"eval_loss": 0.4550356864929199, |
|
"eval_precision": 0.9322033898305084, |
|
"eval_recall": 0.9322033898305084, |
|
"eval_runtime": 1.1103, |
|
"eval_samples_per_second": 53.137, |
|
"eval_steps_per_second": 1.801, |
|
"step": 55 |
|
}, |
|
{ |
|
"epoch": 13.882352941176471, |
|
"eval_accuracy": 0.9491525423728814, |
|
"eval_f1_score": 0.947908749000523, |
|
"eval_loss": 0.4313892722129822, |
|
"eval_precision": 0.9476985709538053, |
|
"eval_recall": 0.9491525423728814, |
|
"eval_runtime": 1.1142, |
|
"eval_samples_per_second": 52.955, |
|
"eval_steps_per_second": 1.795, |
|
"step": 59 |
|
}, |
|
{ |
|
"epoch": 14.117647058823529, |
|
"grad_norm": 5.196343898773193, |
|
"learning_rate": 3.7037037037037037e-05, |
|
"loss": 0.01, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 14.823529411764707, |
|
"eval_accuracy": 0.9491525423728814, |
|
"eval_f1_score": 0.9519982027408203, |
|
"eval_loss": 0.41266247630119324, |
|
"eval_precision": 0.961864406779661, |
|
"eval_recall": 0.9491525423728814, |
|
"eval_runtime": 1.1128, |
|
"eval_samples_per_second": 53.019, |
|
"eval_steps_per_second": 1.797, |
|
"step": 63 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.9491525423728814, |
|
"eval_f1_score": 0.947908749000523, |
|
"eval_loss": 0.3284989297389984, |
|
"eval_precision": 0.9476985709538053, |
|
"eval_recall": 0.9491525423728814, |
|
"eval_runtime": 1.1075, |
|
"eval_samples_per_second": 53.271, |
|
"eval_steps_per_second": 1.806, |
|
"step": 68 |
|
}, |
|
{ |
|
"epoch": 16.941176470588236, |
|
"eval_accuracy": 0.9491525423728814, |
|
"eval_f1_score": 0.947908749000523, |
|
"eval_loss": 0.3179616332054138, |
|
"eval_precision": 0.9476985709538053, |
|
"eval_recall": 0.9491525423728814, |
|
"eval_runtime": 1.0963, |
|
"eval_samples_per_second": 53.819, |
|
"eval_steps_per_second": 1.824, |
|
"step": 72 |
|
}, |
|
{ |
|
"epoch": 17.647058823529413, |
|
"grad_norm": 5.957318305969238, |
|
"learning_rate": 3.240740740740741e-05, |
|
"loss": 0.0076, |
|
"step": 75 |
|
}, |
|
{ |
|
"epoch": 17.88235294117647, |
|
"eval_accuracy": 0.9322033898305084, |
|
"eval_f1_score": 0.9286307743436357, |
|
"eval_loss": 0.44822579622268677, |
|
"eval_precision": 0.9293164462655988, |
|
"eval_recall": 0.9322033898305084, |
|
"eval_runtime": 1.1817, |
|
"eval_samples_per_second": 49.929, |
|
"eval_steps_per_second": 1.693, |
|
"step": 76 |
|
}, |
|
{ |
|
"epoch": 18.823529411764707, |
|
"eval_accuracy": 0.9322033898305084, |
|
"eval_f1_score": 0.9322033898305084, |
|
"eval_loss": 0.44370484352111816, |
|
"eval_precision": 0.9322033898305084, |
|
"eval_recall": 0.9322033898305084, |
|
"eval_runtime": 1.1079, |
|
"eval_samples_per_second": 53.253, |
|
"eval_steps_per_second": 1.805, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_accuracy": 0.9322033898305084, |
|
"eval_f1_score": 0.9322033898305084, |
|
"eval_loss": 0.4818989932537079, |
|
"eval_precision": 0.9322033898305084, |
|
"eval_recall": 0.9322033898305084, |
|
"eval_runtime": 1.3186, |
|
"eval_samples_per_second": 44.744, |
|
"eval_steps_per_second": 1.517, |
|
"step": 85 |
|
}, |
|
{ |
|
"epoch": 20.941176470588236, |
|
"eval_accuracy": 0.9322033898305084, |
|
"eval_f1_score": 0.9286307743436357, |
|
"eval_loss": 0.5132895112037659, |
|
"eval_precision": 0.9293164462655988, |
|
"eval_recall": 0.9322033898305084, |
|
"eval_runtime": 1.1055, |
|
"eval_samples_per_second": 53.367, |
|
"eval_steps_per_second": 1.809, |
|
"step": 89 |
|
}, |
|
{ |
|
"epoch": 21.176470588235293, |
|
"grad_norm": 0.27098149061203003, |
|
"learning_rate": 2.777777777777778e-05, |
|
"loss": 0.0003, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 21.88235294117647, |
|
"eval_accuracy": 0.9491525423728814, |
|
"eval_f1_score": 0.947908749000523, |
|
"eval_loss": 0.45395800471305847, |
|
"eval_precision": 0.9476985709538053, |
|
"eval_recall": 0.9491525423728814, |
|
"eval_runtime": 1.1075, |
|
"eval_samples_per_second": 53.275, |
|
"eval_steps_per_second": 1.806, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 22.823529411764707, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.9170563800358625, |
|
"eval_loss": 0.38566043972969055, |
|
"eval_precision": 0.9196471809062606, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.0947, |
|
"eval_samples_per_second": 53.897, |
|
"eval_steps_per_second": 1.827, |
|
"step": 97 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_accuracy": 0.8983050847457628, |
|
"eval_f1_score": 0.9023521272915945, |
|
"eval_loss": 0.4077180027961731, |
|
"eval_precision": 0.9092193117616847, |
|
"eval_recall": 0.8983050847457628, |
|
"eval_runtime": 1.1092, |
|
"eval_samples_per_second": 53.192, |
|
"eval_steps_per_second": 1.803, |
|
"step": 102 |
|
}, |
|
{ |
|
"epoch": 24.705882352941178, |
|
"grad_norm": 0.018473587930202484, |
|
"learning_rate": 2.314814814814815e-05, |
|
"loss": 0.0028, |
|
"step": 105 |
|
}, |
|
{ |
|
"epoch": 24.941176470588236, |
|
"eval_accuracy": 0.9491525423728814, |
|
"eval_f1_score": 0.947908749000523, |
|
"eval_loss": 0.3955690562725067, |
|
"eval_precision": 0.9476985709538053, |
|
"eval_recall": 0.9491525423728814, |
|
"eval_runtime": 1.2914, |
|
"eval_samples_per_second": 45.688, |
|
"eval_steps_per_second": 1.549, |
|
"step": 106 |
|
}, |
|
{ |
|
"epoch": 25.88235294117647, |
|
"eval_accuracy": 0.9322033898305084, |
|
"eval_f1_score": 0.9286307743436357, |
|
"eval_loss": 0.4670986831188202, |
|
"eval_precision": 0.9293164462655988, |
|
"eval_recall": 0.9322033898305084, |
|
"eval_runtime": 1.1219, |
|
"eval_samples_per_second": 52.592, |
|
"eval_steps_per_second": 1.783, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 26.823529411764707, |
|
"eval_accuracy": 0.9322033898305084, |
|
"eval_f1_score": 0.9322033898305084, |
|
"eval_loss": 0.3811493515968323, |
|
"eval_precision": 0.9322033898305084, |
|
"eval_recall": 0.9322033898305084, |
|
"eval_runtime": 1.2582, |
|
"eval_samples_per_second": 46.893, |
|
"eval_steps_per_second": 1.59, |
|
"step": 114 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_accuracy": 0.9322033898305084, |
|
"eval_f1_score": 0.9322033898305084, |
|
"eval_loss": 0.3700270354747772, |
|
"eval_precision": 0.9322033898305084, |
|
"eval_recall": 0.9322033898305084, |
|
"eval_runtime": 1.1041, |
|
"eval_samples_per_second": 53.436, |
|
"eval_steps_per_second": 1.811, |
|
"step": 119 |
|
}, |
|
{ |
|
"epoch": 28.235294117647058, |
|
"grad_norm": 0.08375111222267151, |
|
"learning_rate": 1.8518518518518518e-05, |
|
"loss": 0.0006, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 28.941176470588236, |
|
"eval_accuracy": 0.9322033898305084, |
|
"eval_f1_score": 0.9322033898305084, |
|
"eval_loss": 0.40281012654304504, |
|
"eval_precision": 0.9322033898305084, |
|
"eval_recall": 0.9322033898305084, |
|
"eval_runtime": 1.1715, |
|
"eval_samples_per_second": 50.362, |
|
"eval_steps_per_second": 1.707, |
|
"step": 123 |
|
}, |
|
{ |
|
"epoch": 29.88235294117647, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.9080138226098403, |
|
"eval_loss": 0.6924118995666504, |
|
"eval_precision": 0.9106172049888072, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.1072, |
|
"eval_samples_per_second": 53.287, |
|
"eval_steps_per_second": 1.806, |
|
"step": 127 |
|
}, |
|
{ |
|
"epoch": 30.823529411764707, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.9080138226098403, |
|
"eval_loss": 0.6948609948158264, |
|
"eval_precision": 0.9106172049888072, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.1092, |
|
"eval_samples_per_second": 53.191, |
|
"eval_steps_per_second": 1.803, |
|
"step": 131 |
|
}, |
|
{ |
|
"epoch": 31.764705882352942, |
|
"grad_norm": 0.0031740041449666023, |
|
"learning_rate": 1.388888888888889e-05, |
|
"loss": 0.0033, |
|
"step": 135 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.9131812483342053, |
|
"eval_loss": 0.5888532996177673, |
|
"eval_precision": 0.912013958125623, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.1154, |
|
"eval_samples_per_second": 52.896, |
|
"eval_steps_per_second": 1.793, |
|
"step": 136 |
|
}, |
|
{ |
|
"epoch": 32.94117647058823, |
|
"eval_accuracy": 0.9322033898305084, |
|
"eval_f1_score": 0.9322033898305084, |
|
"eval_loss": 0.5128433108329773, |
|
"eval_precision": 0.9322033898305084, |
|
"eval_recall": 0.9322033898305084, |
|
"eval_runtime": 1.0996, |
|
"eval_samples_per_second": 53.657, |
|
"eval_steps_per_second": 1.819, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 33.88235294117647, |
|
"eval_accuracy": 0.9491525423728814, |
|
"eval_f1_score": 0.9502338280215176, |
|
"eval_loss": 0.44105064868927, |
|
"eval_precision": 0.9521964718090626, |
|
"eval_recall": 0.9491525423728814, |
|
"eval_runtime": 1.3012, |
|
"eval_samples_per_second": 45.342, |
|
"eval_steps_per_second": 1.537, |
|
"step": 144 |
|
}, |
|
{ |
|
"epoch": 34.8235294117647, |
|
"eval_accuracy": 0.9491525423728814, |
|
"eval_f1_score": 0.9502338280215176, |
|
"eval_loss": 0.4420201778411865, |
|
"eval_precision": 0.9521964718090626, |
|
"eval_recall": 0.9491525423728814, |
|
"eval_runtime": 1.1093, |
|
"eval_samples_per_second": 53.188, |
|
"eval_steps_per_second": 1.803, |
|
"step": 148 |
|
}, |
|
{ |
|
"epoch": 35.294117647058826, |
|
"grad_norm": 0.0013447869569063187, |
|
"learning_rate": 9.259259259259259e-06, |
|
"loss": 0.0013, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_accuracy": 0.9322033898305084, |
|
"eval_f1_score": 0.9322033898305084, |
|
"eval_loss": 0.5615989565849304, |
|
"eval_precision": 0.9322033898305084, |
|
"eval_recall": 0.9322033898305084, |
|
"eval_runtime": 1.1347, |
|
"eval_samples_per_second": 51.997, |
|
"eval_steps_per_second": 1.763, |
|
"step": 153 |
|
}, |
|
{ |
|
"epoch": 36.94117647058823, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.9131812483342053, |
|
"eval_loss": 0.6365456581115723, |
|
"eval_precision": 0.912013958125623, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.0934, |
|
"eval_samples_per_second": 53.961, |
|
"eval_steps_per_second": 1.829, |
|
"step": 157 |
|
}, |
|
{ |
|
"epoch": 37.88235294117647, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.9131812483342053, |
|
"eval_loss": 0.6694910526275635, |
|
"eval_precision": 0.912013958125623, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.0997, |
|
"eval_samples_per_second": 53.65, |
|
"eval_steps_per_second": 1.819, |
|
"step": 161 |
|
}, |
|
{ |
|
"epoch": 38.8235294117647, |
|
"grad_norm": 0.0024713820312172174, |
|
"learning_rate": 4.6296296296296296e-06, |
|
"loss": 0.0001, |
|
"step": 165 |
|
}, |
|
{ |
|
"epoch": 38.8235294117647, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.9131812483342053, |
|
"eval_loss": 0.6845612525939941, |
|
"eval_precision": 0.912013958125623, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.1919, |
|
"eval_samples_per_second": 49.501, |
|
"eval_steps_per_second": 1.678, |
|
"step": 165 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.9131812483342053, |
|
"eval_loss": 0.6930243968963623, |
|
"eval_precision": 0.912013958125623, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.1022, |
|
"eval_samples_per_second": 53.53, |
|
"eval_steps_per_second": 1.815, |
|
"step": 170 |
|
}, |
|
{ |
|
"epoch": 40.94117647058823, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.9131812483342053, |
|
"eval_loss": 0.6957547068595886, |
|
"eval_precision": 0.912013958125623, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.1025, |
|
"eval_samples_per_second": 53.515, |
|
"eval_steps_per_second": 1.814, |
|
"step": 174 |
|
}, |
|
{ |
|
"epoch": 41.88235294117647, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.9131812483342053, |
|
"eval_loss": 0.6966932415962219, |
|
"eval_precision": 0.912013958125623, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.0997, |
|
"eval_samples_per_second": 53.649, |
|
"eval_steps_per_second": 1.819, |
|
"step": 178 |
|
}, |
|
{ |
|
"epoch": 42.35294117647059, |
|
"grad_norm": 0.0012529775267466903, |
|
"learning_rate": 0.0, |
|
"loss": 0.0044, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 42.35294117647059, |
|
"eval_accuracy": 0.9152542372881356, |
|
"eval_f1_score": 0.9131812483342053, |
|
"eval_loss": 0.6952070593833923, |
|
"eval_precision": 0.912013958125623, |
|
"eval_recall": 0.9152542372881356, |
|
"eval_runtime": 1.142, |
|
"eval_samples_per_second": 51.664, |
|
"eval_steps_per_second": 1.751, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 42.35294117647059, |
|
"step": 180, |
|
"total_flos": 1.7260934287224177e+18, |
|
"train_loss": 0.030212831471969064, |
|
"train_runtime": 1290.1323, |
|
"train_samples_per_second": 18.347, |
|
"train_steps_per_second": 0.14 |
|
}, |
|
{ |
|
"epoch": 42.35294117647059, |
|
"eval_accuracy": 0.9387755102040817, |
|
"eval_f1_score": 0.9412065766745571, |
|
"eval_loss": 0.3751787841320038, |
|
"eval_precision": 0.9451036228444866, |
|
"eval_recall": 0.9387755102040817, |
|
"eval_runtime": 3.0643, |
|
"eval_samples_per_second": 47.972, |
|
"eval_steps_per_second": 1.632, |
|
"step": 180 |
|
} |
|
], |
|
"logging_steps": 15, |
|
"max_steps": 180, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 45, |
|
"save_steps": 500, |
|
"total_flos": 1.7260934287224177e+18, |
|
"train_batch_size": 32, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|