{ "best_metric": 0.6452859350850078, "best_model_checkpoint": "resnet-50-FV2-finetuned-memes/checkpoint-400", "epoch": 19.987654320987655, "global_step": 400, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.49, "learning_rate": 3e-05, "loss": 1.5967, "step": 10 }, { "epoch": 0.99, "learning_rate": 6e-05, "loss": 1.5763, "step": 20 }, { "epoch": 0.99, "eval_accuracy": 0.4281298299845441, "eval_f1": 0.26687554630409566, "eval_loss": 1.5574817657470703, "eval_precision": 0.29655663588874154, "eval_recall": 0.4281298299845441, "eval_runtime": 11.3953, "eval_samples_per_second": 113.556, "eval_steps_per_second": 1.843, "step": 20 }, { "epoch": 1.49, "learning_rate": 9e-05, "loss": 1.5775, "step": 30 }, { "epoch": 1.99, "learning_rate": 0.00012, "loss": 1.4761, "step": 40 }, { "epoch": 1.99, "eval_accuracy": 0.43431221020092736, "eval_f1": 0.2630209721259926, "eval_loss": 1.4423725605010986, "eval_precision": 0.18862709592961452, "eval_recall": 0.43431221020092736, "eval_runtime": 10.1591, "eval_samples_per_second": 127.373, "eval_steps_per_second": 2.067, "step": 40 }, { "epoch": 2.49, "learning_rate": 0.00011666666666666667, "loss": 1.444, "step": 50 }, { "epoch": 2.99, "learning_rate": 0.00011333333333333333, "loss": 1.3563, "step": 60 }, { "epoch": 2.99, "eval_accuracy": 0.43431221020092736, "eval_f1": 0.2630209721259926, "eval_loss": 1.3240060806274414, "eval_precision": 0.18862709592961452, "eval_recall": 0.43431221020092736, "eval_runtime": 10.039, "eval_samples_per_second": 128.897, "eval_steps_per_second": 2.092, "step": 60 }, { "epoch": 3.49, "learning_rate": 0.00011, "loss": 1.3356, "step": 70 }, { "epoch": 3.99, "learning_rate": 0.00010666666666666667, "loss": 1.2824, "step": 80 }, { "epoch": 3.99, "eval_accuracy": 0.43894899536321486, "eval_f1": 0.27337332937410136, "eval_loss": 1.263592004776001, "eval_precision": 0.3097252114961456, "eval_recall": 0.43894899536321486, "eval_runtime": 10.0514, "eval_samples_per_second": 128.739, "eval_steps_per_second": 2.089, "step": 80 }, { "epoch": 4.49, "learning_rate": 0.00010333333333333334, "loss": 1.2695, "step": 90 }, { "epoch": 4.99, "learning_rate": 0.0001, "loss": 1.2315, "step": 100 }, { "epoch": 4.99, "eval_accuracy": 0.4528593508500773, "eval_f1": 0.30415713999389604, "eval_loss": 1.2118711471557617, "eval_precision": 0.3235903479528001, "eval_recall": 0.4528593508500773, "eval_runtime": 10.1242, "eval_samples_per_second": 127.813, "eval_steps_per_second": 2.074, "step": 100 }, { "epoch": 5.49, "learning_rate": 9.666666666666667e-05, "loss": 1.2096, "step": 110 }, { "epoch": 5.99, "learning_rate": 9.333333333333334e-05, "loss": 1.1956, "step": 120 }, { "epoch": 5.99, "eval_accuracy": 0.4899536321483771, "eval_f1": 0.3692247614974613, "eval_loss": 1.1763864755630493, "eval_precision": 0.3730719437429542, "eval_recall": 0.4899536321483771, "eval_runtime": 10.0285, "eval_samples_per_second": 129.033, "eval_steps_per_second": 2.094, "step": 120 }, { "epoch": 6.49, "learning_rate": 9e-05, "loss": 1.1727, "step": 130 }, { "epoch": 6.99, "learning_rate": 8.666666666666667e-05, "loss": 1.1452, "step": 140 }, { "epoch": 6.99, "eval_accuracy": 0.5146831530139103, "eval_f1": 0.4090229013083186, "eval_loss": 1.1424295902252197, "eval_precision": 0.396316505367188, "eval_recall": 0.5146831530139103, "eval_runtime": 11.1, "eval_samples_per_second": 116.577, "eval_steps_per_second": 1.892, "step": 140 }, { "epoch": 7.49, "learning_rate": 8.333333333333333e-05, "loss": 1.1455, "step": 150 }, { "epoch": 7.99, "learning_rate": 7.999999999999999e-05, "loss": 1.1076, "step": 160 }, { "epoch": 7.99, "eval_accuracy": 0.5370942812982998, "eval_f1": 0.4392356918841944, "eval_loss": 1.1189799308776855, "eval_precision": 0.41207140655215574, "eval_recall": 0.5370942812982998, "eval_runtime": 10.2542, "eval_samples_per_second": 126.192, "eval_steps_per_second": 2.048, "step": 160 }, { "epoch": 8.49, "learning_rate": 7.666666666666667e-05, "loss": 1.1204, "step": 170 }, { "epoch": 8.99, "learning_rate": 7.333333333333334e-05, "loss": 1.0679, "step": 180 }, { "epoch": 8.99, "eval_accuracy": 0.5718701700154559, "eval_f1": 0.48309150932194556, "eval_loss": 1.0824542045593262, "eval_precision": 0.44653696889067535, "eval_recall": 0.5718701700154559, "eval_runtime": 10.0099, "eval_samples_per_second": 129.272, "eval_steps_per_second": 2.098, "step": 180 }, { "epoch": 9.49, "learning_rate": 7.000000000000001e-05, "loss": 1.0551, "step": 190 }, { "epoch": 9.99, "learning_rate": 6.666666666666667e-05, "loss": 1.0432, "step": 200 }, { "epoch": 9.99, "eval_accuracy": 0.5749613601236476, "eval_f1": 0.4930062944584295, "eval_loss": 1.0481715202331543, "eval_precision": 0.5404301068833355, "eval_recall": 0.5749613601236476, "eval_runtime": 19.2474, "eval_samples_per_second": 67.23, "eval_steps_per_second": 1.091, "step": 200 }, { "epoch": 10.49, "learning_rate": 6.333333333333333e-05, "loss": 1.0465, "step": 210 }, { "epoch": 10.99, "learning_rate": 6e-05, "loss": 0.9903, "step": 220 }, { "epoch": 10.99, "eval_accuracy": 0.5958268933539412, "eval_f1": 0.5240773887363929, "eval_loss": 1.0275342464447021, "eval_precision": 0.545875829974407, "eval_recall": 0.5958268933539412, "eval_runtime": 9.9464, "eval_samples_per_second": 130.097, "eval_steps_per_second": 2.111, "step": 220 }, { "epoch": 11.49, "learning_rate": 5.6666666666666664e-05, "loss": 1.0046, "step": 230 }, { "epoch": 11.99, "learning_rate": 5.333333333333333e-05, "loss": 0.9675, "step": 240 }, { "epoch": 11.99, "eval_accuracy": 0.6051004636785162, "eval_f1": 0.5379053813016494, "eval_loss": 1.0145165920257568, "eval_precision": 0.5349771722020813, "eval_recall": 0.6051004636785162, "eval_runtime": 10.1612, "eval_samples_per_second": 127.347, "eval_steps_per_second": 2.067, "step": 240 }, { "epoch": 12.49, "learning_rate": 5e-05, "loss": 0.997, "step": 250 }, { "epoch": 12.99, "learning_rate": 4.666666666666667e-05, "loss": 0.9335, "step": 260 }, { "epoch": 12.99, "eval_accuracy": 0.6174652241112828, "eval_f1": 0.552720253591733, "eval_loss": 0.9859771728515625, "eval_precision": 0.5536990181229813, "eval_recall": 0.6174652241112828, "eval_runtime": 11.4078, "eval_samples_per_second": 113.431, "eval_steps_per_second": 1.841, "step": 260 }, { "epoch": 13.49, "learning_rate": 4.3333333333333334e-05, "loss": 0.9501, "step": 270 }, { "epoch": 13.99, "learning_rate": 3.9999999999999996e-05, "loss": 0.9157, "step": 280 }, { "epoch": 13.99, "eval_accuracy": 0.6105100463678517, "eval_f1": 0.5504384069346341, "eval_loss": 0.9683175683021545, "eval_precision": 0.5386397521561105, "eval_recall": 0.6105100463678517, "eval_runtime": 10.0837, "eval_samples_per_second": 128.326, "eval_steps_per_second": 2.083, "step": 280 }, { "epoch": 14.49, "learning_rate": 3.666666666666667e-05, "loss": 0.9324, "step": 290 }, { "epoch": 14.99, "learning_rate": 3.3333333333333335e-05, "loss": 0.8901, "step": 300 }, { "epoch": 14.99, "eval_accuracy": 0.6352395672333848, "eval_f1": 0.5833124251549139, "eval_loss": 0.95584636926651, "eval_precision": 0.5686172096380677, "eval_recall": 0.6352395672333848, "eval_runtime": 11.1778, "eval_samples_per_second": 115.766, "eval_steps_per_second": 1.879, "step": 300 }, { "epoch": 15.49, "learning_rate": 3e-05, "loss": 0.9157, "step": 310 }, { "epoch": 15.99, "learning_rate": 2.6666666666666667e-05, "loss": 0.8722, "step": 320 }, { "epoch": 15.99, "eval_accuracy": 0.634466769706337, "eval_f1": 0.5807225066585998, "eval_loss": 0.9381548762321472, "eval_precision": 0.5656504472537988, "eval_recall": 0.634466769706337, "eval_runtime": 10.0783, "eval_samples_per_second": 128.395, "eval_steps_per_second": 2.084, "step": 320 }, { "epoch": 16.49, "learning_rate": 2.3333333333333336e-05, "loss": 0.9132, "step": 330 }, { "epoch": 16.99, "learning_rate": 1.9999999999999998e-05, "loss": 0.854, "step": 340 }, { "epoch": 16.99, "eval_accuracy": 0.6375579598145286, "eval_f1": 0.5855599844273062, "eval_loss": 0.9322208166122437, "eval_precision": 0.5622591012744048, "eval_recall": 0.6375579598145286, "eval_runtime": 10.1911, "eval_samples_per_second": 126.973, "eval_steps_per_second": 2.061, "step": 340 }, { "epoch": 17.49, "learning_rate": 1.6666666666666667e-05, "loss": 0.8979, "step": 350 }, { "epoch": 17.99, "learning_rate": 1.3333333333333333e-05, "loss": 0.8494, "step": 360 }, { "epoch": 17.99, "eval_accuracy": 0.6421947449768161, "eval_f1": 0.5918308732628852, "eval_loss": 0.9286540746688843, "eval_precision": 0.6675486262621129, "eval_recall": 0.6421947449768161, "eval_runtime": 11.41, "eval_samples_per_second": 113.409, "eval_steps_per_second": 1.84, "step": 360 }, { "epoch": 18.49, "learning_rate": 9.999999999999999e-06, "loss": 0.8649, "step": 370 }, { "epoch": 18.99, "learning_rate": 6.666666666666667e-06, "loss": 0.8652, "step": 380 }, { "epoch": 18.99, "eval_accuracy": 0.6398763523956723, "eval_f1": 0.586308244884445, "eval_loss": 0.9211938977241516, "eval_precision": 0.5640414016020209, "eval_recall": 0.6398763523956723, "eval_runtime": 10.0413, "eval_samples_per_second": 128.867, "eval_steps_per_second": 2.091, "step": 380 }, { "epoch": 19.49, "learning_rate": 3.3333333333333333e-06, "loss": 0.8826, "step": 390 }, { "epoch": 19.99, "learning_rate": 0.0, "loss": 0.846, "step": 400 }, { "epoch": 19.99, "eval_accuracy": 0.6452859350850078, "eval_f1": 0.5963647629954705, "eval_loss": 0.9262650012969971, "eval_precision": 0.5727919568038408, "eval_recall": 0.6452859350850078, "eval_runtime": 10.2246, "eval_samples_per_second": 126.557, "eval_steps_per_second": 2.054, "step": 400 }, { "epoch": 19.99, "step": 400, "total_flos": 2.1968670326740623e+18, "train_loss": 1.0949385786056518, "train_runtime": 1181.8167, "train_samples_per_second": 87.56, "train_steps_per_second": 0.338 } ], "max_steps": 400, "num_train_epochs": 20, "total_flos": 2.1968670326740623e+18, "trial_name": null, "trial_params": null }