{ "best_metric": 0.14495012164115906, "best_model_checkpoint": "./test-small-bert-with-loss-weight/checkpoint-1500", "epoch": 1.968503937007874, "global_step": 2000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.49, "learning_rate": 4.1797900262467194e-05, "loss": 0.1546, "step": 500 }, { "epoch": 0.49, "eval_accuracy": 0.8429757067519668, "eval_f1": 0.27041574613376174, "eval_loss": 0.14738939702510834, "eval_precision": 0.8877752868257945, "eval_recall": 0.1594996090695856, "eval_runtime": 8.7195, "eval_samples_per_second": 1128.732, "eval_steps_per_second": 4.473, "step": 500 }, { "epoch": 0.98, "learning_rate": 3.3595800524934386e-05, "loss": 0.1506, "step": 1000 }, { "epoch": 0.98, "eval_accuracy": 0.8417091726463214, "eval_f1": 0.2548480963718129, "eval_loss": 0.14584653079509735, "eval_precision": 0.9028258362168397, "eval_recall": 0.14836401544767455, "eval_runtime": 8.6401, "eval_samples_per_second": 1139.107, "eval_steps_per_second": 4.514, "step": 1000 }, { "epoch": 1.48, "learning_rate": 2.5393700787401574e-05, "loss": 0.1485, "step": 1500 }, { "epoch": 1.48, "eval_accuracy": 0.8470173770208351, "eval_f1": 0.30824260667305176, "eval_loss": 0.14495012164115906, "eval_precision": 0.8806120169756534, "eval_recall": 0.18681735257184828, "eval_runtime": 8.8318, "eval_samples_per_second": 1114.387, "eval_steps_per_second": 4.416, "step": 1500 }, { "epoch": 1.97, "learning_rate": 1.7191601049868766e-05, "loss": 0.1487, "step": 2000 }, { "epoch": 1.97, "eval_accuracy": 0.8434339068038385, "eval_f1": 0.27119803613827514, "eval_loss": 0.14501141011714935, "eval_precision": 0.8996128687758643, "eval_recall": 0.15966545833629492, "eval_runtime": 8.7797, "eval_samples_per_second": 1120.994, "eval_steps_per_second": 4.442, "step": 2000 } ], "max_steps": 3048, "num_train_epochs": 3, "total_flos": 621176549989632.0, "trial_name": null, "trial_params": null }