|
{ |
|
"best_metric": 0.8772656654583117, |
|
"best_model_checkpoint": "swin-base-patch4-window7-224-in22k-cons_Classification_base_V10/checkpoint-105", |
|
"epoch": 6.885245901639344, |
|
"eval_steps": 500, |
|
"global_step": 105, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.6557377049180327, |
|
"grad_norm": 4.642137050628662, |
|
"learning_rate": 4.545454545454546e-05, |
|
"loss": 0.7975, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 0.9836065573770492, |
|
"step": 15, |
|
"train_accuracy": 0.8178880703114902, |
|
"train_auc_class_0": 0.8980438574304173, |
|
"train_auc_class_1": 0.9139826205363317, |
|
"train_auc_class_2": 0.8919882412630196, |
|
"train_auc_overall": 0.9013382397432562, |
|
"train_loss": 0.46714112162590027, |
|
"train_runtime": 689.8789, |
|
"train_samples_per_second": 11.215, |
|
"train_steps_per_second": 0.088 |
|
}, |
|
{ |
|
"epoch": 0.9836065573770492, |
|
"eval_accuracy": 0.8524080787156914, |
|
"eval_auc_class_0": 0.9181721665274296, |
|
"eval_auc_class_1": 0.9324510717614166, |
|
"eval_auc_class_2": 0.9299151491872829, |
|
"eval_auc_overall": 0.9268461291587097, |
|
"eval_loss": 0.4173153042793274, |
|
"eval_runtime": 342.4588, |
|
"eval_samples_per_second": 5.639, |
|
"eval_steps_per_second": 0.047, |
|
"step": 15 |
|
}, |
|
{ |
|
"epoch": 1.3114754098360657, |
|
"grad_norm": 2.1029186248779297, |
|
"learning_rate": 4.5212765957446815e-05, |
|
"loss": 0.5023, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 1.9672131147540983, |
|
"grad_norm": 1.8800333738327026, |
|
"learning_rate": 3.9893617021276594e-05, |
|
"loss": 0.4094, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 1.9672131147540983, |
|
"step": 30, |
|
"train_accuracy": 0.8503295851105079, |
|
"train_auc_class_0": 0.9326458902508805, |
|
"train_auc_class_1": 0.9445850486238231, |
|
"train_auc_class_2": 0.9445771168575358, |
|
"train_auc_overall": 0.9406026852440799, |
|
"train_loss": 0.3614955544471741, |
|
"train_runtime": 693.803, |
|
"train_samples_per_second": 11.152, |
|
"train_steps_per_second": 0.088 |
|
}, |
|
{ |
|
"epoch": 1.9672131147540983, |
|
"eval_accuracy": 0.849818746763335, |
|
"eval_auc_class_0": 0.9336946035724231, |
|
"eval_auc_class_1": 0.9488809233636819, |
|
"eval_auc_class_2": 0.9534673603715279, |
|
"eval_auc_overall": 0.9453476291025443, |
|
"eval_loss": 0.3673703968524933, |
|
"eval_runtime": 266.4299, |
|
"eval_samples_per_second": 7.248, |
|
"eval_steps_per_second": 0.06, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 2.6229508196721314, |
|
"grad_norm": 2.8551852703094482, |
|
"learning_rate": 3.4574468085106386e-05, |
|
"loss": 0.3672, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 2.9508196721311473, |
|
"step": 45, |
|
"train_accuracy": 0.864417732971436, |
|
"train_auc_class_0": 0.9455359129962017, |
|
"train_auc_class_1": 0.9545585538591823, |
|
"train_auc_class_2": 0.9593322426521459, |
|
"train_auc_overall": 0.9531422365025098, |
|
"train_loss": 0.32408276200294495, |
|
"train_runtime": 685.3567, |
|
"train_samples_per_second": 11.289, |
|
"train_steps_per_second": 0.089 |
|
}, |
|
{ |
|
"epoch": 2.9508196721311473, |
|
"eval_accuracy": 0.8726048679440704, |
|
"eval_auc_class_0": 0.9429575923936826, |
|
"eval_auc_class_1": 0.9536497239945516, |
|
"eval_auc_class_2": 0.9603724007891477, |
|
"eval_auc_overall": 0.9523265723924607, |
|
"eval_loss": 0.3238150477409363, |
|
"eval_runtime": 204.7854, |
|
"eval_samples_per_second": 9.429, |
|
"eval_steps_per_second": 0.078, |
|
"step": 45 |
|
}, |
|
{ |
|
"epoch": 3.278688524590164, |
|
"grad_norm": 2.7802083492279053, |
|
"learning_rate": 2.925531914893617e-05, |
|
"loss": 0.3328, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 3.9344262295081966, |
|
"grad_norm": 2.6021904945373535, |
|
"learning_rate": 2.393617021276596e-05, |
|
"loss": 0.3237, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"step": 61, |
|
"train_accuracy": 0.8729481711257593, |
|
"train_auc_class_0": 0.9494105682362736, |
|
"train_auc_class_1": 0.960331196185584, |
|
"train_auc_class_2": 0.9563328693868581, |
|
"train_auc_overall": 0.955358211269572, |
|
"train_loss": 0.31062838435173035, |
|
"train_runtime": 681.8052, |
|
"train_samples_per_second": 11.348, |
|
"train_steps_per_second": 0.089 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.8720870015535992, |
|
"eval_auc_class_0": 0.9470949198392808, |
|
"eval_auc_class_1": 0.9577675819055128, |
|
"eval_auc_class_2": 0.961633814620179, |
|
"eval_auc_overall": 0.9554987721216577, |
|
"eval_loss": 0.32258161902427673, |
|
"eval_runtime": 204.0189, |
|
"eval_samples_per_second": 9.465, |
|
"eval_steps_per_second": 0.078, |
|
"step": 61 |
|
}, |
|
{ |
|
"epoch": 4.590163934426229, |
|
"grad_norm": 2.246328592300415, |
|
"learning_rate": 1.8617021276595745e-05, |
|
"loss": 0.3257, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 4.983606557377049, |
|
"step": 76, |
|
"train_accuracy": 0.879798371461807, |
|
"train_auc_class_0": 0.9544922319365635, |
|
"train_auc_class_1": 0.9627755801666535, |
|
"train_auc_class_2": 0.9628861811778814, |
|
"train_auc_overall": 0.9600513310936994, |
|
"train_loss": 0.29983675479888916, |
|
"train_runtime": 688.2036, |
|
"train_samples_per_second": 11.242, |
|
"train_steps_per_second": 0.089 |
|
}, |
|
{ |
|
"epoch": 4.983606557377049, |
|
"eval_accuracy": 0.8741584671154842, |
|
"eval_auc_class_0": 0.9478719119226638, |
|
"eval_auc_class_1": 0.9577360384256937, |
|
"eval_auc_class_2": 0.9608001466557257, |
|
"eval_auc_overall": 0.9554693656680278, |
|
"eval_loss": 0.32330793142318726, |
|
"eval_runtime": 205.4973, |
|
"eval_samples_per_second": 9.397, |
|
"eval_steps_per_second": 0.078, |
|
"step": 76 |
|
}, |
|
{ |
|
"epoch": 5.245901639344262, |
|
"grad_norm": 1.7804102897644043, |
|
"learning_rate": 1.3297872340425532e-05, |
|
"loss": 0.2972, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 5.901639344262295, |
|
"grad_norm": 1.6500009298324585, |
|
"learning_rate": 7.97872340425532e-06, |
|
"loss": 0.2923, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 5.967213114754099, |
|
"step": 91, |
|
"train_accuracy": 0.8857438283572444, |
|
"train_auc_class_0": 0.9581288331197666, |
|
"train_auc_class_1": 0.966850418082771, |
|
"train_auc_class_2": 0.9694481750082071, |
|
"train_auc_overall": 0.9648091420702481, |
|
"train_loss": 0.28071513772010803, |
|
"train_runtime": 686.7084, |
|
"train_samples_per_second": 11.267, |
|
"train_steps_per_second": 0.089 |
|
}, |
|
{ |
|
"epoch": 5.967213114754099, |
|
"eval_accuracy": 0.8736406007250129, |
|
"eval_auc_class_0": 0.9477737001233243, |
|
"eval_auc_class_1": 0.9590063803856907, |
|
"eval_auc_class_2": 0.9627250030553275, |
|
"eval_auc_overall": 0.9565016945214474, |
|
"eval_loss": 0.3128957450389862, |
|
"eval_runtime": 206.0937, |
|
"eval_samples_per_second": 9.37, |
|
"eval_steps_per_second": 0.078, |
|
"step": 91 |
|
}, |
|
{ |
|
"epoch": 6.557377049180328, |
|
"grad_norm": 2.4247124195098877, |
|
"learning_rate": 2.6595744680851065e-06, |
|
"loss": 0.2794, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 6.885245901639344, |
|
"step": 105, |
|
"train_accuracy": 0.8973762440222308, |
|
"train_auc_class_0": 0.9638374809913217, |
|
"train_auc_class_1": 0.9706794670135619, |
|
"train_auc_class_2": 0.9722462334871682, |
|
"train_auc_overall": 0.9689210604973506, |
|
"train_loss": 0.26410263776779175, |
|
"train_runtime": 684.8081, |
|
"train_samples_per_second": 11.298, |
|
"train_steps_per_second": 0.089 |
|
}, |
|
{ |
|
"epoch": 6.885245901639344, |
|
"eval_accuracy": 0.8772656654583117, |
|
"eval_auc_class_0": 0.9495477284481044, |
|
"eval_auc_class_1": 0.9596716610509716, |
|
"eval_auc_class_2": 0.9626115194580721, |
|
"eval_auc_overall": 0.9572769696523826, |
|
"eval_loss": 0.30786964297294617, |
|
"eval_runtime": 205.1702, |
|
"eval_samples_per_second": 9.412, |
|
"eval_steps_per_second": 0.078, |
|
"step": 105 |
|
}, |
|
{ |
|
"epoch": 6.885245901639344, |
|
"step": 105, |
|
"total_flos": 4.1785312376666235e+18, |
|
"train_loss": 0.38806929134187246, |
|
"train_runtime": 12116.6555, |
|
"train_samples_per_second": 4.47, |
|
"train_steps_per_second": 0.009 |
|
} |
|
], |
|
"logging_steps": 10, |
|
"max_steps": 105, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 7, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": true |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 4.1785312376666235e+18, |
|
"train_batch_size": 128, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|