Jeckmu's picture
Upload folder using huggingface_hub
1663891 verified
{"current_steps": 5, "total_steps": 105, "loss": 4.4182, "lr": 4.9821173158545936e-05, "epoch": 0.1413427561837456, "percentage": 4.76, "elapsed_time": "0:03:21", "remaining_time": "1:07:01", "throughput": 444.43, "total_tokens": 89360}
{"current_steps": 10, "total_steps": 105, "loss": 2.2953, "lr": 4.928725095732169e-05, "epoch": 0.2826855123674912, "percentage": 9.52, "elapsed_time": "0:06:22", "remaining_time": "1:00:33", "throughput": 454.06, "total_tokens": 173680}
{"current_steps": 15, "total_steps": 105, "loss": 2.6132, "lr": 4.813260751184992e-05, "epoch": 0.42402826855123676, "percentage": 14.29, "elapsed_time": "0:09:20", "remaining_time": "0:56:00", "throughput": 457.68, "total_tokens": 256320}
{"current_steps": 20, "total_steps": 105, "loss": 2.6473, "lr": 4.6461219840046654e-05, "epoch": 0.5653710247349824, "percentage": 19.05, "elapsed_time": "0:12:53", "remaining_time": "0:54:46", "throughput": 457.95, "total_tokens": 354080}
{"current_steps": 25, "total_steps": 105, "loss": 1.9798, "lr": 4.431042398061499e-05, "epoch": 0.7067137809187279, "percentage": 23.81, "elapsed_time": "0:16:10", "remaining_time": "0:51:44", "throughput": 458.77, "total_tokens": 445120}
{"current_steps": 30, "total_steps": 105, "loss": 1.6494, "lr": 4.172826515897146e-05, "epoch": 0.8480565371024735, "percentage": 28.57, "elapsed_time": "0:19:27", "remaining_time": "0:48:38", "throughput": 459.28, "total_tokens": 536160}
{"current_steps": 35, "total_steps": 105, "loss": 1.2652, "lr": 3.8772424536302564e-05, "epoch": 0.9893992932862191, "percentage": 33.33, "elapsed_time": "0:22:36", "remaining_time": "0:45:13", "throughput": 458.59, "total_tokens": 622160}
{"current_steps": 40, "total_steps": 105, "loss": 1.1679, "lr": 3.550893070773914e-05, "epoch": 1.1130742049469964, "percentage": 38.1, "elapsed_time": "0:25:32", "remaining_time": "0:41:31", "throughput": 458.57, "total_tokens": 702992}
{"current_steps": 45, "total_steps": 105, "loss": 0.7785, "lr": 3.201068473265007e-05, "epoch": 1.254416961130742, "percentage": 42.86, "elapsed_time": "0:28:53", "remaining_time": "0:38:31", "throughput": 458.89, "total_tokens": 795712}
{"current_steps": 50, "total_steps": 105, "loss": 1.3648, "lr": 2.8355831645441388e-05, "epoch": 1.3957597173144876, "percentage": 47.62, "elapsed_time": "0:32:02", "remaining_time": "0:35:15", "throughput": 457.64, "total_tokens": 880032}
{"current_steps": 55, "total_steps": 105, "loss": 1.1121, "lr": 2.4626014824618415e-05, "epoch": 1.5371024734982333, "percentage": 52.38, "elapsed_time": "0:35:18", "remaining_time": "0:32:05", "throughput": 457.57, "total_tokens": 969392}
{"current_steps": 60, "total_steps": 105, "loss": 1.1847, "lr": 2.090455221462156e-05, "epoch": 1.6784452296819787, "percentage": 57.14, "elapsed_time": "0:38:39", "remaining_time": "0:28:59", "throughput": 456.4, "total_tokens": 1058752}
{"current_steps": 65, "total_steps": 105, "loss": 0.4018, "lr": 1.7274575140626318e-05, "epoch": 1.8197879858657244, "percentage": 61.9, "elapsed_time": "0:41:41", "remaining_time": "0:25:39", "throughput": 456.99, "total_tokens": 1143072}
{"current_steps": 70, "total_steps": 105, "loss": 0.7509, "lr": 1.3817171292109183e-05, "epoch": 1.96113074204947, "percentage": 66.67, "elapsed_time": "0:44:58", "remaining_time": "0:22:29", "throughput": 457.33, "total_tokens": 1234112}
{"current_steps": 75, "total_steps": 105, "loss": 0.46, "lr": 1.0609573357858166e-05, "epoch": 2.0848056537102475, "percentage": 71.43, "elapsed_time": "0:47:27", "remaining_time": "0:18:58", "throughput": 457.74, "total_tokens": 1303184}
{"current_steps": 80, "total_steps": 105, "loss": 0.4216, "lr": 7.723433775328384e-06, "epoch": 2.2261484098939928, "percentage": 76.19, "elapsed_time": "0:50:24", "remaining_time": "0:15:45", "throughput": 458.16, "total_tokens": 1385824}
{"current_steps": 85, "total_steps": 105, "loss": 0.5816, "lr": 5.223224133591476e-06, "epoch": 2.3674911660777385, "percentage": 80.95, "elapsed_time": "0:53:42", "remaining_time": "0:12:38", "throughput": 458.34, "total_tokens": 1476864}
{"current_steps": 90, "total_steps": 105, "loss": 0.4955, "lr": 3.164794984571759e-06, "epoch": 2.508833922261484, "percentage": 85.71, "elapsed_time": "0:57:11", "remaining_time": "0:09:31", "throughput": 457.37, "total_tokens": 1569584}
{"current_steps": 95, "total_steps": 105, "loss": 0.2691, "lr": 1.59412823400657e-06, "epoch": 2.65017667844523, "percentage": 90.48, "elapsed_time": "1:00:22", "remaining_time": "0:06:21", "throughput": 457.51, "total_tokens": 1657264}
{"current_steps": 100, "total_steps": 105, "loss": 1.1078, "lr": 5.463099816548579e-07, "epoch": 2.791519434628975, "percentage": 95.24, "elapsed_time": "1:03:40", "remaining_time": "0:03:11", "throughput": 457.2, "total_tokens": 1746624}
{"current_steps": 105, "total_steps": 105, "loss": 0.6358, "lr": 4.474675580662113e-08, "epoch": 2.932862190812721, "percentage": 100.0, "elapsed_time": "1:07:11", "remaining_time": "0:00:00", "throughput": 456.62, "total_tokens": 1841024}
{"current_steps": 105, "total_steps": 105, "epoch": 2.932862190812721, "percentage": 100.0, "elapsed_time": "1:07:13", "remaining_time": "0:00:00", "throughput": 456.44, "total_tokens": 1841024}