djbp's picture
End of training
718277b verified
raw
history blame
6.21 kB
{
"best_metric": 0.5,
"best_model_checkpoint": "swin-base-patch4-window7-224-in22k-cons_Classification_base_V10/checkpoint-2",
"epoch": 7.0,
"eval_steps": 500,
"global_step": 7,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"step": 1,
"train_accuracy": 0.2,
"train_auc_class_0": 0.45999999999999996,
"train_auc_class_1": 0.28,
"train_auc_class_2": 0.38,
"train_auc_overall": 0.37333333333333335,
"train_loss": 1.2419202327728271,
"train_runtime": 1.6771,
"train_samples_per_second": 8.944,
"train_steps_per_second": 0.596
},
{
"epoch": 1.0,
"eval_accuracy": 0.0,
"eval_auc_class_0": 0.5,
"eval_auc_class_1": 0.25,
"eval_auc_class_2": 0.5,
"eval_auc_overall": 0.4166666666666667,
"eval_loss": 1.1770787239074707,
"eval_runtime": 0.97,
"eval_samples_per_second": 6.185,
"eval_steps_per_second": 1.031,
"step": 1
},
{
"epoch": 2.0,
"step": 2,
"train_accuracy": 0.6666666666666666,
"train_auc_class_0": 0.82,
"train_auc_class_1": 0.92,
"train_auc_class_2": 0.86,
"train_auc_overall": 0.8666666666666667,
"train_loss": 0.8910435438156128,
"train_runtime": 1.6903,
"train_samples_per_second": 8.874,
"train_steps_per_second": 0.592
},
{
"epoch": 2.0,
"eval_accuracy": 0.5,
"eval_auc_class_0": 0.5,
"eval_auc_class_1": 0.625,
"eval_auc_class_2": 0.625,
"eval_auc_overall": 0.5833333333333334,
"eval_loss": 1.09449303150177,
"eval_runtime": 0.7379,
"eval_samples_per_second": 8.132,
"eval_steps_per_second": 1.355,
"step": 2
},
{
"epoch": 3.0,
"step": 3,
"train_accuracy": 0.8666666666666667,
"train_auc_class_0": 0.98,
"train_auc_class_1": 1.0,
"train_auc_class_2": 0.98,
"train_auc_overall": 0.9866666666666667,
"train_loss": 0.6887053847312927,
"train_runtime": 1.7287,
"train_samples_per_second": 8.677,
"train_steps_per_second": 0.578
},
{
"epoch": 3.0,
"eval_accuracy": 0.5,
"eval_auc_class_0": 0.5,
"eval_auc_class_1": 0.75,
"eval_auc_class_2": 0.75,
"eval_auc_overall": 0.6666666666666666,
"eval_loss": 1.030716896057129,
"eval_runtime": 0.7962,
"eval_samples_per_second": 7.536,
"eval_steps_per_second": 1.256,
"step": 3
},
{
"epoch": 4.0,
"step": 4,
"train_accuracy": 1.0,
"train_auc_class_0": 1.0,
"train_auc_class_1": 1.0,
"train_auc_class_2": 1.0,
"train_auc_overall": 1.0,
"train_loss": 0.5273771286010742,
"train_runtime": 1.7311,
"train_samples_per_second": 8.665,
"train_steps_per_second": 0.578
},
{
"epoch": 4.0,
"eval_accuracy": 0.5,
"eval_auc_class_0": 0.75,
"eval_auc_class_1": 0.875,
"eval_auc_class_2": 0.875,
"eval_auc_overall": 0.8333333333333334,
"eval_loss": 0.9745334982872009,
"eval_runtime": 0.708,
"eval_samples_per_second": 8.474,
"eval_steps_per_second": 1.412,
"step": 4
},
{
"epoch": 5.0,
"step": 5,
"train_accuracy": 1.0,
"train_auc_class_0": 1.0,
"train_auc_class_1": 1.0,
"train_auc_class_2": 1.0,
"train_auc_overall": 1.0,
"train_loss": 0.4640212059020996,
"train_runtime": 1.7287,
"train_samples_per_second": 8.677,
"train_steps_per_second": 0.578
},
{
"epoch": 5.0,
"eval_accuracy": 0.5,
"eval_auc_class_0": 0.75,
"eval_auc_class_1": 0.875,
"eval_auc_class_2": 0.875,
"eval_auc_overall": 0.8333333333333334,
"eval_loss": 0.928966224193573,
"eval_runtime": 0.7026,
"eval_samples_per_second": 8.54,
"eval_steps_per_second": 1.423,
"step": 5
},
{
"epoch": 6.0,
"step": 6,
"train_accuracy": 0.9333333333333333,
"train_auc_class_0": 1.0,
"train_auc_class_1": 1.0,
"train_auc_class_2": 1.0,
"train_auc_overall": 1.0,
"train_loss": 0.4194321036338806,
"train_runtime": 1.7268,
"train_samples_per_second": 8.687,
"train_steps_per_second": 0.579
},
{
"epoch": 6.0,
"eval_accuracy": 0.5,
"eval_auc_class_0": 0.75,
"eval_auc_class_1": 1.0,
"eval_auc_class_2": 0.875,
"eval_auc_overall": 0.875,
"eval_loss": 0.8979067206382751,
"eval_runtime": 0.6949,
"eval_samples_per_second": 8.634,
"eval_steps_per_second": 1.439,
"step": 6
},
{
"epoch": 7.0,
"step": 7,
"train_accuracy": 1.0,
"train_auc_class_0": 1.0,
"train_auc_class_1": 1.0,
"train_auc_class_2": 1.0,
"train_auc_overall": 1.0,
"train_loss": 0.402330219745636,
"train_runtime": 1.8612,
"train_samples_per_second": 8.059,
"train_steps_per_second": 0.537
},
{
"epoch": 7.0,
"eval_accuracy": 0.5,
"eval_auc_class_0": 0.875,
"eval_auc_class_1": 1.0,
"eval_auc_class_2": 0.875,
"eval_auc_overall": 0.9166666666666666,
"eval_loss": 0.8809628486633301,
"eval_runtime": 0.7654,
"eval_samples_per_second": 7.839,
"eval_steps_per_second": 1.306,
"step": 7
},
{
"epoch": 7.0,
"step": 7,
"total_flos": 8226380544399360.0,
"train_loss": 0.1908613954271589,
"train_runtime": 147.7634,
"train_samples_per_second": 0.711,
"train_steps_per_second": 0.047
}
],
"logging_steps": 10,
"max_steps": 7,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 8226380544399360.0,
"train_batch_size": 128,
"trial_name": null,
"trial_params": null
}