File size: 2,281 Bytes
d8e9335 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 20.337552742616033,
"global_step": 2400,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 3.39,
"learning_rate": 0.00023999999999999998,
"loss": 6.3317,
"step": 400
},
{
"epoch": 3.39,
"eval_loss": 3.161163806915283,
"eval_runtime": 205.0119,
"eval_samples_per_second": 8.687,
"eval_wer": 1.0,
"step": 400
},
{
"epoch": 6.78,
"learning_rate": 0.0002703947368421052,
"loss": 1.6739,
"step": 800
},
{
"epoch": 6.78,
"eval_loss": 0.6274727582931519,
"eval_runtime": 205.8605,
"eval_samples_per_second": 8.651,
"eval_wer": 1.008992553042012,
"step": 800
},
{
"epoch": 10.17,
"learning_rate": 0.00023092105263157893,
"loss": 0.3726,
"step": 1200
},
{
"epoch": 10.17,
"eval_loss": 0.6007506847381592,
"eval_runtime": 208.514,
"eval_samples_per_second": 8.541,
"eval_wer": 0.9197695658282984,
"step": 1200
},
{
"epoch": 13.56,
"learning_rate": 0.00019144736842105262,
"loss": 0.2323,
"step": 1600
},
{
"epoch": 13.56,
"eval_loss": 0.62809157371521,
"eval_runtime": 207.5386,
"eval_samples_per_second": 8.582,
"eval_wer": 0.9513840101166222,
"step": 1600
},
{
"epoch": 16.95,
"learning_rate": 0.00015197368421052628,
"loss": 0.1598,
"step": 2000
},
{
"epoch": 16.95,
"eval_loss": 0.679410994052887,
"eval_runtime": 213.3742,
"eval_samples_per_second": 8.347,
"eval_wer": 0.8642686525221301,
"step": 2000
},
{
"epoch": 20.34,
"learning_rate": 0.0001125,
"loss": 0.1258,
"step": 2400
},
{
"epoch": 20.34,
"eval_loss": 0.7365503311157227,
"eval_runtime": 210.0426,
"eval_samples_per_second": 8.479,
"eval_wer": 0.8294225094843333,
"step": 2400
}
],
"max_steps": 3540,
"num_train_epochs": 30,
"total_flos": 1.022364819420586e+19,
"trial_name": null,
"trial_params": null
}
|