|
{ |
|
"best_metric": 27.250397341424648, |
|
"best_model_checkpoint": "./checkpoint-50", |
|
"epoch": 99.01, |
|
"global_step": 200, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 12.01, |
|
"learning_rate": 9.210526315789473e-07, |
|
"loss": 0.752, |
|
"step": 25 |
|
}, |
|
{ |
|
"epoch": 24.01, |
|
"learning_rate": 7.947368421052631e-07, |
|
"loss": 0.425, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 24.01, |
|
"eval_loss": 0.4105507731437683, |
|
"eval_runtime": 786.9933, |
|
"eval_samples_per_second": 1.006, |
|
"eval_steps_per_second": 0.032, |
|
"eval_wer": 27.250397341424648, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 37.01, |
|
"learning_rate": 6.63157894736842e-07, |
|
"loss": 0.2879, |
|
"step": 75 |
|
}, |
|
{ |
|
"epoch": 49.01, |
|
"learning_rate": 5.31578947368421e-07, |
|
"loss": 0.1906, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 49.01, |
|
"eval_loss": 0.44195765256881714, |
|
"eval_runtime": 813.6355, |
|
"eval_samples_per_second": 0.973, |
|
"eval_steps_per_second": 0.031, |
|
"eval_wer": 29.013148388961135, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 62.01, |
|
"learning_rate": 4e-07, |
|
"loss": 0.1347, |
|
"step": 125 |
|
}, |
|
{ |
|
"epoch": 74.01, |
|
"learning_rate": 2.684210526315789e-07, |
|
"loss": 0.0982, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 74.01, |
|
"eval_loss": 0.4795360267162323, |
|
"eval_runtime": 848.8397, |
|
"eval_samples_per_second": 0.933, |
|
"eval_steps_per_second": 0.029, |
|
"eval_wer": 30.306314116457163, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"learning_rate": 1.368421052631579e-07, |
|
"loss": 0.0829, |
|
"step": 175 |
|
}, |
|
{ |
|
"epoch": 99.01, |
|
"learning_rate": 5.263157894736842e-09, |
|
"loss": 0.0717, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 99.01, |
|
"eval_loss": 0.4944527745246887, |
|
"eval_runtime": 875.6338, |
|
"eval_samples_per_second": 0.904, |
|
"eval_steps_per_second": 0.029, |
|
"eval_wer": 30.891489669122958, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 99.01, |
|
"step": 200, |
|
"total_flos": 1.387640884064256e+20, |
|
"train_loss": 0.25535590410232545, |
|
"train_runtime": 48457.1181, |
|
"train_samples_per_second": 2.113, |
|
"train_steps_per_second": 0.004 |
|
} |
|
], |
|
"max_steps": 200, |
|
"num_train_epochs": 9223372036854775807, |
|
"total_flos": 1.387640884064256e+20, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|