|
{"current_steps": 5, "total_steps": 105, "loss": 4.3219, "lr": 4.972077065562821e-05, "epoch": 0.1413427561837456, "percentage": 4.76, "elapsed_time": "0:02:26", "remaining_time": "0:48:48", "throughput": 610.23, "total_tokens": 89360} |
|
{"current_steps": 10, "total_steps": 105, "loss": 2.7795, "lr": 4.888932014465352e-05, "epoch": 0.2826855123674912, "percentage": 9.52, "elapsed_time": "0:04:37", "remaining_time": "0:43:57", "throughput": 625.65, "total_tokens": 173680} |
|
{"current_steps": 15, "total_steps": 105, "loss": 3.1788, "lr": 4.783863644106502e-05, "epoch": 0.42402826855123676, "percentage": 14.29, "elapsed_time": "0:06:45", "remaining_time": "0:40:35", "throughput": 631.57, "total_tokens": 256320} |
|
{"current_steps": 20, "total_steps": 105, "loss": 2.8887, "lr": 4.606802396635098e-05, "epoch": 0.5653710247349824, "percentage": 19.05, "elapsed_time": "0:09:21", "remaining_time": "0:39:46", "throughput": 630.67, "total_tokens": 354080} |
|
{"current_steps": 25, "total_steps": 105, "loss": 2.5454, "lr": 4.382678665009028e-05, "epoch": 0.7067137809187279, "percentage": 23.81, "elapsed_time": "0:11:44", "remaining_time": "0:37:34", "throughput": 631.72, "total_tokens": 445120} |
|
{"current_steps": 30, "total_steps": 105, "loss": 2.201, "lr": 4.116499003039499e-05, "epoch": 0.8480565371024735, "percentage": 28.57, "elapsed_time": "0:14:07", "remaining_time": "0:35:19", "throughput": 632.41, "total_tokens": 536160} |
|
{"current_steps": 35, "total_steps": 105, "loss": 1.3345, "lr": 3.814209424526262e-05, "epoch": 0.9893992932862191, "percentage": 33.33, "elapsed_time": "0:16:26", "remaining_time": "0:32:52", "throughput": 630.92, "total_tokens": 622160} |
|
{"current_steps": 40, "total_steps": 105, "loss": 0.9507, "lr": 3.4825625791348096e-05, "epoch": 1.1130742049469964, "percentage": 38.1, "elapsed_time": "0:18:33", "remaining_time": "0:30:09", "throughput": 631.24, "total_tokens": 702992} |
|
{"current_steps": 45, "total_steps": 105, "loss": 0.6257, "lr": 3.1289669093612714e-05, "epoch": 1.254416961130742, "percentage": 42.86, "elapsed_time": "0:20:59", "remaining_time": "0:27:59", "throughput": 631.56, "total_tokens": 795712} |
|
{"current_steps": 50, "total_steps": 105, "loss": 1.9766, "lr": 2.761321158169134e-05, "epoch": 1.3957597173144876, "percentage": 47.62, "elapsed_time": "0:23:18", "remaining_time": "0:25:38", "throughput": 629.2, "total_tokens": 880032} |
|
{"current_steps": 55, "total_steps": 105, "loss": 1.0377, "lr": 2.3878379241237136e-05, "epoch": 1.5371024734982333, "percentage": 52.38, "elapsed_time": "0:25:40", "remaining_time": "0:23:20", "throughput": 629.38, "total_tokens": 969392} |
|
{"current_steps": 60, "total_steps": 105, "loss": 1.5486, "lr": 2.0168602055111173e-05, "epoch": 1.6784452296819787, "percentage": 57.14, "elapsed_time": "0:28:08", "remaining_time": "0:21:06", "throughput": 627.11, "total_tokens": 1058752} |
|
{"current_steps": 65, "total_steps": 105, "loss": 0.7542, "lr": 1.6566750315429254e-05, "epoch": 1.8197879858657244, "percentage": 61.9, "elapsed_time": "0:30:19", "remaining_time": "0:18:39", "throughput": 628.22, "total_tokens": 1143072} |
|
{"current_steps": 70, "total_steps": 105, "loss": 0.7561, "lr": 1.3153283438175034e-05, "epoch": 1.96113074204947, "percentage": 66.67, "elapsed_time": "0:32:42", "remaining_time": "0:16:21", "throughput": 628.73, "total_tokens": 1234112} |
|
{"current_steps": 75, "total_steps": 105, "loss": 0.73, "lr": 1.0004452632802158e-05, "epoch": 2.0848056537102475, "percentage": 71.43, "elapsed_time": "0:34:29", "remaining_time": "0:13:47", "throughput": 629.72, "total_tokens": 1303184} |
|
{"current_steps": 80, "total_steps": 105, "loss": 0.5124, "lr": 7.190597576216385e-06, "epoch": 2.2261484098939928, "percentage": 76.19, "elapsed_time": "0:36:37", "remaining_time": "0:11:26", "throughput": 630.55, "total_tokens": 1385824} |
|
{"current_steps": 85, "total_steps": 105, "loss": 0.7801, "lr": 4.7745751406263165e-06, "epoch": 2.3674911660777385, "percentage": 80.95, "elapsed_time": "0:39:01", "remaining_time": "0:09:10", "throughput": 630.83, "total_tokens": 1476864} |
|
{"current_steps": 90, "total_steps": 105, "loss": 0.3849, "lr": 2.8103552748861476e-06, "epoch": 2.508833922261484, "percentage": 85.71, "elapsed_time": "0:41:35", "remaining_time": "0:06:55", "throughput": 629.03, "total_tokens": 1569584} |
|
{"current_steps": 95, "total_steps": 105, "loss": 0.4539, "lr": 1.3418154050208936e-06, "epoch": 2.65017667844523, "percentage": 90.48, "elapsed_time": "0:43:52", "remaining_time": "0:04:37", "throughput": 629.45, "total_tokens": 1657264} |
|
{"current_steps": 100, "total_steps": 105, "loss": 1.1474, "lr": 4.0176028503425835e-07, "epoch": 2.791519434628975, "percentage": 95.24, "elapsed_time": "0:46:17", "remaining_time": "0:02:18", "throughput": 628.9, "total_tokens": 1746624} |
|
{"current_steps": 105, "total_steps": 105, "loss": 0.7139, "lr": 1.1189192912416934e-08, "epoch": 2.932862190812721, "percentage": 100.0, "elapsed_time": "0:48:51", "remaining_time": "0:00:00", "throughput": 627.96, "total_tokens": 1841024} |
|
{"current_steps": 105, "total_steps": 105, "epoch": 2.932862190812721, "percentage": 100.0, "elapsed_time": "0:48:53", "remaining_time": "0:00:00", "throughput": 627.67, "total_tokens": 1841024} |
|
|