{ "best_metric": 0.07841455936431885, "best_model_checkpoint": "./vit-base-beans/checkpoint-280", "epoch": 0.7608695652173914, "global_step": 280, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.03, "learning_rate": 0.00019322033898305085, "loss": 0.6554, "step": 10 }, { "epoch": 0.05, "learning_rate": 0.0001864406779661017, "loss": 0.306, "step": 20 }, { "epoch": 0.08, "learning_rate": 0.00017966101694915257, "loss": 0.267, "step": 30 }, { "epoch": 0.11, "learning_rate": 0.00017288135593220342, "loss": 0.2825, "step": 40 }, { "epoch": 0.11, "eval_accuracy": 0.9318801089918256, "eval_loss": 0.2294050008058548, "eval_runtime": 16.8062, "eval_samples_per_second": 43.674, "eval_steps_per_second": 5.474, "step": 40 }, { "epoch": 0.14, "learning_rate": 0.00016610169491525423, "loss": 0.3097, "step": 50 }, { "epoch": 0.16, "learning_rate": 0.00015932203389830508, "loss": 0.2772, "step": 60 }, { "epoch": 0.19, "learning_rate": 0.00015254237288135592, "loss": 0.1711, "step": 70 }, { "epoch": 0.22, "learning_rate": 0.00014576271186440677, "loss": 0.1483, "step": 80 }, { "epoch": 0.22, "eval_accuracy": 0.944141689373297, "eval_loss": 0.16020944714546204, "eval_runtime": 17.3798, "eval_samples_per_second": 42.233, "eval_steps_per_second": 5.294, "step": 80 }, { "epoch": 0.24, "learning_rate": 0.00013898305084745764, "loss": 0.2356, "step": 90 }, { "epoch": 0.27, "learning_rate": 0.00013220338983050849, "loss": 0.1144, "step": 100 }, { "epoch": 0.3, "learning_rate": 0.00012542372881355933, "loss": 0.2216, "step": 110 }, { "epoch": 0.33, "learning_rate": 0.00011864406779661017, "loss": 0.2209, "step": 120 }, { "epoch": 0.33, "eval_accuracy": 0.829700272479564, "eval_loss": 0.29767370223999023, "eval_runtime": 17.13, "eval_samples_per_second": 42.849, "eval_steps_per_second": 5.371, "step": 120 }, { "epoch": 0.35, "learning_rate": 0.00011186440677966102, "loss": 0.2153, "step": 130 }, { "epoch": 0.38, "learning_rate": 0.00010508474576271188, "loss": 0.1693, "step": 140 }, { "epoch": 0.41, "learning_rate": 9.830508474576272e-05, "loss": 0.1625, "step": 150 }, { "epoch": 0.43, "learning_rate": 9.152542372881357e-05, "loss": 0.1384, "step": 160 }, { "epoch": 0.43, "eval_accuracy": 0.9645776566757494, "eval_loss": 0.10578873753547668, "eval_runtime": 16.6083, "eval_samples_per_second": 44.195, "eval_steps_per_second": 5.539, "step": 160 }, { "epoch": 0.46, "learning_rate": 8.474576271186441e-05, "loss": 0.1371, "step": 170 }, { "epoch": 0.49, "learning_rate": 7.796610169491526e-05, "loss": 0.1355, "step": 180 }, { "epoch": 0.52, "learning_rate": 7.11864406779661e-05, "loss": 0.1557, "step": 190 }, { "epoch": 0.54, "learning_rate": 6.440677966101695e-05, "loss": 0.1551, "step": 200 }, { "epoch": 0.54, "eval_accuracy": 0.9114441416893733, "eval_loss": 0.1725204885005951, "eval_runtime": 17.0671, "eval_samples_per_second": 43.007, "eval_steps_per_second": 5.39, "step": 200 }, { "epoch": 0.57, "learning_rate": 5.76271186440678e-05, "loss": 0.2091, "step": 210 }, { "epoch": 0.6, "learning_rate": 5.0847457627118643e-05, "loss": 0.1313, "step": 220 }, { "epoch": 0.62, "learning_rate": 4.4067796610169495e-05, "loss": 0.1056, "step": 230 }, { "epoch": 0.65, "learning_rate": 3.728813559322034e-05, "loss": 0.1608, "step": 240 }, { "epoch": 0.65, "eval_accuracy": 0.9673024523160763, "eval_loss": 0.09211871027946472, "eval_runtime": 16.6063, "eval_samples_per_second": 44.2, "eval_steps_per_second": 5.54, "step": 240 }, { "epoch": 0.68, "learning_rate": 3.050847457627119e-05, "loss": 0.0761, "step": 250 }, { "epoch": 0.71, "learning_rate": 2.3728813559322036e-05, "loss": 0.1044, "step": 260 }, { "epoch": 0.73, "learning_rate": 1.694915254237288e-05, "loss": 0.1141, "step": 270 }, { "epoch": 0.76, "learning_rate": 1.016949152542373e-05, "loss": 0.12, "step": 280 }, { "epoch": 0.76, "eval_accuracy": 0.9754768392370572, "eval_loss": 0.07841455936431885, "eval_runtime": 16.7459, "eval_samples_per_second": 43.832, "eval_steps_per_second": 5.494, "step": 280 } ], "max_steps": 295, "num_train_epochs": 1, "total_flos": 3.471672249955123e+17, "trial_name": null, "trial_params": null }