{ "best_metric": null, "best_model_checkpoint": null, "epoch": 2.0, "global_step": 500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 1.9992e-05, "loss": 2.3035, "step": 1 }, { "epoch": 0.5, "learning_rate": 1.9e-05, "loss": 2.1461, "step": 125 }, { "epoch": 0.5, "eval_accuracy": 0.5465, "eval_disk_space_total": 78.1898422241211, "eval_disk_space_used": 24.584102630615234, "eval_f1": 0.4711252488920671, "eval_gpu_ram_allocated": 0.3996291160583496, "eval_gpu_ram_cached": 12.9296875, "eval_gpu_ram_total": 39.56402587890625, "eval_gpu_utilization": 28, "eval_loss": 1.8486889600753784, "eval_precision": 0.5180898369172832, "eval_recall": 0.5465, "eval_runtime": 1.5234, "eval_samples_per_second": 1312.845, "eval_steps_per_second": 41.355, "eval_system_ram_total": 83.48074722290039, "eval_system_ram_used": 3.8797760009765625, "step": 125 }, { "epoch": 1.0, "learning_rate": 1.8e-05, "loss": 1.6793, "step": 250 }, { "epoch": 1.0, "eval_accuracy": 0.615, "eval_disk_space_total": 78.1898422241211, "eval_disk_space_used": 24.584190368652344, "eval_f1": 0.5799151958404197, "eval_gpu_ram_allocated": 0.3996119499206543, "eval_gpu_ram_cached": 12.9296875, "eval_gpu_ram_total": 39.56402587890625, "eval_gpu_utilization": 28, "eval_loss": 1.5279773473739624, "eval_precision": 0.6206909881233017, "eval_recall": 0.615, "eval_runtime": 1.5357, "eval_samples_per_second": 1302.337, "eval_steps_per_second": 41.024, "eval_system_ram_total": 83.48074722290039, "eval_system_ram_used": 3.8827476501464844, "step": 250 }, { "epoch": 1.5, "learning_rate": 1.7e-05, "loss": 1.4163, "step": 375 }, { "epoch": 1.5, "eval_accuracy": 0.6675, "eval_disk_space_total": 78.1898422241211, "eval_disk_space_used": 24.584190368652344, "eval_f1": 0.6507803054121275, "eval_gpu_ram_allocated": 0.3996291160583496, "eval_gpu_ram_cached": 12.9296875, "eval_gpu_ram_total": 39.56402587890625, "eval_gpu_utilization": 28, "eval_loss": 1.3395830392837524, "eval_precision": 0.6690538200035159, "eval_recall": 0.6675, "eval_runtime": 1.5175, "eval_samples_per_second": 1317.927, "eval_steps_per_second": 41.515, "eval_system_ram_total": 83.48074722290039, "eval_system_ram_used": 3.883075714111328, "step": 375 }, { "epoch": 2.0, "learning_rate": 1.6000000000000003e-05, "loss": 1.2855, "step": 500 }, { "epoch": 2.0, "eval_accuracy": 0.6745, "eval_disk_space_total": 78.1898422241211, "eval_disk_space_used": 24.584270477294922, "eval_f1": 0.6633189544214071, "eval_gpu_ram_allocated": 0.3995933532714844, "eval_gpu_ram_cached": 12.9296875, "eval_gpu_ram_total": 39.56402587890625, "eval_gpu_utilization": 30, "eval_loss": 1.2413243055343628, "eval_precision": 0.6741774761001332, "eval_recall": 0.6745, "eval_runtime": 1.5166, "eval_samples_per_second": 1318.761, "eval_steps_per_second": 41.541, "eval_system_ram_total": 83.48074722290039, "eval_system_ram_used": 3.897541046142578, "step": 500 } ], "max_steps": 2500, "num_train_epochs": 10, "total_flos": 252176442301056.0, "trial_name": null, "trial_params": null }