{ "best_metric": 0.908256880733945, "best_model_checkpoint": "google-vit-base-patch16-224-cartoon-emotion-detection/checkpoint-128", "epoch": 19.96969696969697, "global_step": 160, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.97, "eval_accuracy": 0.5779816513761468, "eval_f1": 0.5496044478283086, "eval_loss": 1.0942180156707764, "eval_precision": 0.6101578737429934, "eval_recall": 0.5779816513761468, "eval_runtime": 6.1545, "eval_samples_per_second": 17.711, "eval_steps_per_second": 0.325, "step": 8 }, { "epoch": 1.24, "learning_rate": 7.500000000000001e-05, "loss": 1.3198, "step": 10 }, { "epoch": 1.97, "eval_accuracy": 0.7614678899082569, "eval_f1": 0.7493394355240011, "eval_loss": 0.6914369463920593, "eval_precision": 0.7497958611640302, "eval_recall": 0.7614678899082569, "eval_runtime": 4.6109, "eval_samples_per_second": 23.64, "eval_steps_per_second": 0.434, "step": 16 }, { "epoch": 2.48, "learning_rate": 0.00011666666666666667, "loss": 0.6694, "step": 20 }, { "epoch": 2.97, "eval_accuracy": 0.7889908256880734, "eval_f1": 0.7780956547838787, "eval_loss": 0.47017431259155273, "eval_precision": 0.7808396335677842, "eval_recall": 0.7889908256880734, "eval_runtime": 5.0072, "eval_samples_per_second": 21.769, "eval_steps_per_second": 0.399, "step": 24 }, { "epoch": 3.73, "learning_rate": 0.00010833333333333334, "loss": 0.2725, "step": 30 }, { "epoch": 3.97, "eval_accuracy": 0.8532110091743119, "eval_f1": 0.852182928635528, "eval_loss": 0.3957468569278717, "eval_precision": 0.8513973454558302, "eval_recall": 0.8532110091743119, "eval_runtime": 5.1072, "eval_samples_per_second": 21.342, "eval_steps_per_second": 0.392, "step": 32 }, { "epoch": 4.97, "learning_rate": 0.0001, "loss": 0.1116, "step": 40 }, { "epoch": 4.97, "eval_accuracy": 0.8715596330275229, "eval_f1": 0.8693196656152253, "eval_loss": 0.3428177833557129, "eval_precision": 0.8696674261696613, "eval_recall": 0.8715596330275229, "eval_runtime": 4.6559, "eval_samples_per_second": 23.411, "eval_steps_per_second": 0.43, "step": 40 }, { "epoch": 5.97, "eval_accuracy": 0.8532110091743119, "eval_f1": 0.852182928635528, "eval_loss": 0.38648203015327454, "eval_precision": 0.8513973454558302, "eval_recall": 0.8532110091743119, "eval_runtime": 4.7748, "eval_samples_per_second": 22.828, "eval_steps_per_second": 0.419, "step": 48 }, { "epoch": 6.24, "learning_rate": 9.166666666666667e-05, "loss": 0.0486, "step": 50 }, { "epoch": 6.97, "eval_accuracy": 0.8532110091743119, "eval_f1": 0.8506716755357531, "eval_loss": 0.3445301055908203, "eval_precision": 0.8494739768520552, "eval_recall": 0.8532110091743119, "eval_runtime": 4.611, "eval_samples_per_second": 23.639, "eval_steps_per_second": 0.434, "step": 56 }, { "epoch": 7.48, "learning_rate": 8.333333333333333e-05, "loss": 0.0346, "step": 60 }, { "epoch": 7.97, "eval_accuracy": 0.8807339449541285, "eval_f1": 0.8831061019446504, "eval_loss": 0.35539454221725464, "eval_precision": 0.8921137072355041, "eval_recall": 0.8807339449541285, "eval_runtime": 5.4806, "eval_samples_per_second": 19.888, "eval_steps_per_second": 0.365, "step": 64 }, { "epoch": 8.73, "learning_rate": 7.500000000000001e-05, "loss": 0.0304, "step": 70 }, { "epoch": 8.97, "eval_accuracy": 0.8623853211009175, "eval_f1": 0.8605019312208758, "eval_loss": 0.3100130259990692, "eval_precision": 0.859227121302747, "eval_recall": 0.8623853211009175, "eval_runtime": 4.4858, "eval_samples_per_second": 24.299, "eval_steps_per_second": 0.446, "step": 72 }, { "epoch": 9.97, "learning_rate": 6.666666666666667e-05, "loss": 0.0215, "step": 80 }, { "epoch": 9.97, "eval_accuracy": 0.8715596330275229, "eval_f1": 0.8706535281458829, "eval_loss": 0.3717760443687439, "eval_precision": 0.8700050641259672, "eval_recall": 0.8715596330275229, "eval_runtime": 4.4596, "eval_samples_per_second": 24.442, "eval_steps_per_second": 0.448, "step": 80 }, { "epoch": 10.97, "eval_accuracy": 0.8899082568807339, "eval_f1": 0.8896213803351865, "eval_loss": 0.3945842683315277, "eval_precision": 0.8901151962474995, "eval_recall": 0.8899082568807339, "eval_runtime": 4.3806, "eval_samples_per_second": 24.882, "eval_steps_per_second": 0.457, "step": 88 }, { "epoch": 11.24, "learning_rate": 5.833333333333333e-05, "loss": 0.0201, "step": 90 }, { "epoch": 11.97, "eval_accuracy": 0.8532110091743119, "eval_f1": 0.8523968233405174, "eval_loss": 0.45045793056488037, "eval_precision": 0.8557594291539246, "eval_recall": 0.8532110091743119, "eval_runtime": 4.5094, "eval_samples_per_second": 24.172, "eval_steps_per_second": 0.444, "step": 96 }, { "epoch": 12.48, "learning_rate": 5e-05, "loss": 0.02, "step": 100 }, { "epoch": 12.97, "eval_accuracy": 0.8715596330275229, "eval_f1": 0.8718071382402676, "eval_loss": 0.45429742336273193, "eval_precision": 0.8734266859810075, "eval_recall": 0.8715596330275229, "eval_runtime": 4.3136, "eval_samples_per_second": 25.269, "eval_steps_per_second": 0.464, "step": 104 }, { "epoch": 13.73, "learning_rate": 4.1666666666666665e-05, "loss": 0.0181, "step": 110 }, { "epoch": 13.97, "eval_accuracy": 0.8899082568807339, "eval_f1": 0.8884082118557669, "eval_loss": 0.38368093967437744, "eval_precision": 0.887776250789288, "eval_recall": 0.8899082568807339, "eval_runtime": 5.0241, "eval_samples_per_second": 21.695, "eval_steps_per_second": 0.398, "step": 112 }, { "epoch": 14.97, "learning_rate": 3.3333333333333335e-05, "loss": 0.0158, "step": 120 }, { "epoch": 14.97, "eval_accuracy": 0.8715596330275229, "eval_f1": 0.8690629924501888, "eval_loss": 0.39043566584587097, "eval_precision": 0.8676131770089379, "eval_recall": 0.8715596330275229, "eval_runtime": 4.6243, "eval_samples_per_second": 23.571, "eval_steps_per_second": 0.432, "step": 120 }, { "epoch": 15.97, "eval_accuracy": 0.908256880733945, "eval_f1": 0.9076765848444429, "eval_loss": 0.38814032077789307, "eval_precision": 0.9077606207554442, "eval_recall": 0.908256880733945, "eval_runtime": 4.4737, "eval_samples_per_second": 24.364, "eval_steps_per_second": 0.447, "step": 128 }, { "epoch": 16.24, "learning_rate": 2.5e-05, "loss": 0.0147, "step": 130 }, { "epoch": 16.97, "eval_accuracy": 0.8807339449541285, "eval_f1": 0.8785402173459473, "eval_loss": 0.4233301281929016, "eval_precision": 0.877296042811741, "eval_recall": 0.8807339449541285, "eval_runtime": 5.5943, "eval_samples_per_second": 19.484, "eval_steps_per_second": 0.358, "step": 136 }, { "epoch": 17.48, "learning_rate": 1.6666666666666667e-05, "loss": 0.0138, "step": 140 }, { "epoch": 17.97, "eval_accuracy": 0.8715596330275229, "eval_f1": 0.8706535281458829, "eval_loss": 0.4334617853164673, "eval_precision": 0.8700050641259672, "eval_recall": 0.8715596330275229, "eval_runtime": 4.4249, "eval_samples_per_second": 24.634, "eval_steps_per_second": 0.452, "step": 144 }, { "epoch": 18.73, "learning_rate": 8.333333333333334e-06, "loss": 0.0166, "step": 150 }, { "epoch": 18.97, "eval_accuracy": 0.8715596330275229, "eval_f1": 0.8701110574601642, "eval_loss": 0.44918692111968994, "eval_precision": 0.8689788374764814, "eval_recall": 0.8715596330275229, "eval_runtime": 4.6129, "eval_samples_per_second": 23.629, "eval_steps_per_second": 0.434, "step": 152 }, { "epoch": 19.97, "learning_rate": 0.0, "loss": 0.016, "step": 160 }, { "epoch": 19.97, "eval_accuracy": 0.8715596330275229, "eval_f1": 0.871683140929764, "eval_loss": 0.4169996976852417, "eval_precision": 0.8725197999744695, "eval_recall": 0.8715596330275229, "eval_runtime": 4.5712, "eval_samples_per_second": 23.845, "eval_steps_per_second": 0.438, "step": 160 }, { "epoch": 19.97, "step": 160, "total_flos": 3.206521023309693e+18, "train_loss": 0.16520703649148344, "train_runtime": 938.1956, "train_samples_per_second": 44.127, "train_steps_per_second": 0.171 } ], "max_steps": 160, "num_train_epochs": 20, "total_flos": 3.206521023309693e+18, "trial_name": null, "trial_params": null }