{ "best_metric": 0.876997915218902, "best_model_checkpoint": "bert-multilabel-tagalog-hate-speech-classifier/checkpoint-790", "epoch": 5.0, "eval_steps": 500, "global_step": 790, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.4650793650793651, "eval_f1": 0.6538124452234881, "eval_loss": 0.2858085036277771, "eval_roc_auc": 0.749062395824874, "eval_runtime": 16.739, "eval_samples_per_second": 37.637, "eval_steps_per_second": 4.72, "step": 158 }, { "epoch": 2.0, "eval_accuracy": 0.7285714285714285, "eval_f1": 0.8368690563277249, "eval_loss": 0.1806272566318512, "eval_roc_auc": 0.8807496256986324, "eval_runtime": 16.7646, "eval_samples_per_second": 37.579, "eval_steps_per_second": 4.712, "step": 316 }, { "epoch": 3.0, "eval_accuracy": 0.7682539682539683, "eval_f1": 0.8638631503920171, "eval_loss": 0.14880089461803436, "eval_roc_auc": 0.9036774632664203, "eval_runtime": 17.0606, "eval_samples_per_second": 36.927, "eval_steps_per_second": 4.631, "step": 474 }, { "epoch": 3.1645569620253164, "grad_norm": 1.8442691564559937, "learning_rate": 7.341772151898735e-06, "loss": 0.2518, "step": 500 }, { "epoch": 4.0, "eval_accuracy": 0.7761904761904762, "eval_f1": 0.8720848056537103, "eval_loss": 0.14489033818244934, "eval_roc_auc": 0.911037414882052, "eval_runtime": 17.6671, "eval_samples_per_second": 35.66, "eval_steps_per_second": 4.472, "step": 632 }, { "epoch": 5.0, "eval_accuracy": 0.780952380952381, "eval_f1": 0.876997915218902, "eval_loss": 0.13758358359336853, "eval_roc_auc": 0.9189734563461635, "eval_runtime": 17.8108, "eval_samples_per_second": 35.372, "eval_steps_per_second": 4.436, "step": 790 } ], "logging_steps": 500, "max_steps": 790, "num_input_tokens_seen": 0, "num_train_epochs": 5, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 414414795110400.0, "train_batch_size": 8, "trial_name": null, "trial_params": null }