{ "best_metric": 0.12063875794410706, "best_model_checkpoint": "./vit-base-beans/checkpoint-160", "epoch": 0.43478260869565216, "global_step": 160, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.03, "learning_rate": 0.0001891304347826087, "loss": 0.6558, "step": 10 }, { "epoch": 0.05, "learning_rate": 0.0001782608695652174, "loss": 0.3045, "step": 20 }, { "epoch": 0.08, "learning_rate": 0.0001673913043478261, "loss": 0.2567, "step": 30 }, { "epoch": 0.11, "learning_rate": 0.0001565217391304348, "loss": 0.2319, "step": 40 }, { "epoch": 0.11, "eval_accuracy": 0.8637602179836512, "eval_loss": 0.2531130313873291, "eval_runtime": 17.2839, "eval_samples_per_second": 42.467, "eval_steps_per_second": 5.323, "step": 40 }, { "epoch": 0.14, "learning_rate": 0.0001456521739130435, "loss": 0.2499, "step": 50 }, { "epoch": 0.16, "learning_rate": 0.0001347826086956522, "loss": 0.2874, "step": 60 }, { "epoch": 0.19, "learning_rate": 0.00012391304347826086, "loss": 0.1609, "step": 70 }, { "epoch": 0.22, "learning_rate": 0.00011304347826086956, "loss": 0.1306, "step": 80 }, { "epoch": 0.22, "eval_accuracy": 0.9564032697547684, "eval_loss": 0.1377830058336258, "eval_runtime": 17.1335, "eval_samples_per_second": 42.84, "eval_steps_per_second": 5.37, "step": 80 }, { "epoch": 0.24, "learning_rate": 0.00010217391304347828, "loss": 0.228, "step": 90 }, { "epoch": 0.27, "learning_rate": 9.130434782608696e-05, "loss": 0.1187, "step": 100 }, { "epoch": 0.3, "learning_rate": 8.043478260869566e-05, "loss": 0.1811, "step": 110 }, { "epoch": 0.33, "learning_rate": 6.956521739130436e-05, "loss": 0.2075, "step": 120 }, { "epoch": 0.33, "eval_accuracy": 0.8419618528610354, "eval_loss": 0.3006892800331116, "eval_runtime": 17.1056, "eval_samples_per_second": 42.91, "eval_steps_per_second": 5.378, "step": 120 }, { "epoch": 0.35, "learning_rate": 5.869565217391305e-05, "loss": 0.2099, "step": 130 }, { "epoch": 0.38, "learning_rate": 4.782608695652174e-05, "loss": 0.1518, "step": 140 }, { "epoch": 0.41, "learning_rate": 3.695652173913043e-05, "loss": 0.1559, "step": 150 }, { "epoch": 0.43, "learning_rate": 2.608695652173913e-05, "loss": 0.1573, "step": 160 }, { "epoch": 0.43, "eval_accuracy": 0.9618528610354223, "eval_loss": 0.12063875794410706, "eval_runtime": 16.7256, "eval_samples_per_second": 43.885, "eval_steps_per_second": 5.501, "step": 160 } ], "max_steps": 184, "num_train_epochs": 1, "total_flos": 1.9838127142600704e+17, "trial_name": null, "trial_params": null }