{"current_steps": 50, "total_steps": 30076, "loss": 5.822, "learning_rate": 1.6622340425531915e-06, "epoch": 0.0033247444102734603, "percentage": 0.17, "elapsed_time": "0:05:53", "remaining_time": "2 days, 10:57:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 30076, "loss": 5.9169, "learning_rate": 3.324468085106383e-06, "epoch": 0.006649488820546921, "percentage": 0.33, "elapsed_time": "0:12:10", "remaining_time": "2 days, 12:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 30076, "loss": 5.2194, "learning_rate": 4.986702127659574e-06, "epoch": 0.009974233230820381, "percentage": 0.5, "elapsed_time": "0:17:51", "remaining_time": "2 days, 11:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 30076, "loss": 4.452, "learning_rate": 6.648936170212766e-06, "epoch": 0.013298977641093841, "percentage": 0.66, "elapsed_time": "0:24:23", "remaining_time": "2 days, 12:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 30076, "loss": 3.6432, "learning_rate": 8.311170212765958e-06, "epoch": 0.0166237220513673, "percentage": 0.83, "elapsed_time": "0:30:08", "remaining_time": "2 days, 11:56:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 30076, "loss": 3.174, "learning_rate": 9.973404255319148e-06, "epoch": 0.019948466461640762, "percentage": 1.0, "elapsed_time": "0:36:21", "remaining_time": "2 days, 12:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 30076, "loss": 2.5593, "learning_rate": 1.1635638297872341e-05, "epoch": 0.02327321087191422, "percentage": 1.16, "elapsed_time": "0:42:47", "remaining_time": "2 days, 12:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 30076, "loss": 2.1801, "learning_rate": 1.3297872340425532e-05, "epoch": 0.026597955282187682, "percentage": 1.33, "elapsed_time": "0:49:04", "remaining_time": "2 days, 12:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 30076, "loss": 1.8083, "learning_rate": 1.4960106382978726e-05, "epoch": 0.02992269969246114, "percentage": 1.5, "elapsed_time": "0:55:24", "remaining_time": "2 days, 12:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 30076, "loss": 1.6401, "learning_rate": 1.6622340425531915e-05, "epoch": 0.0332474441027346, "percentage": 1.66, "elapsed_time": "1:01:51", "remaining_time": "2 days, 12:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 30076, "loss": 1.5832, "learning_rate": 1.8284574468085108e-05, "epoch": 0.036572188513008065, "percentage": 1.83, "elapsed_time": "1:07:54", "remaining_time": "2 days, 12:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 30076, "loss": 1.4445, "learning_rate": 1.9946808510638297e-05, "epoch": 0.039896932923281524, "percentage": 1.99, "elapsed_time": "1:14:02", "remaining_time": "2 days, 12:37:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 30076, "loss": 1.3488, "learning_rate": 2.1609042553191493e-05, "epoch": 0.04322167733355498, "percentage": 2.16, "elapsed_time": "1:20:38", "remaining_time": "2 days, 12:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 30076, "loss": 1.2645, "learning_rate": 2.3271276595744682e-05, "epoch": 0.04654642174382844, "percentage": 2.33, "elapsed_time": "1:26:34", "remaining_time": "2 days, 12:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 30076, "loss": 1.2705, "learning_rate": 2.4933510638297874e-05, "epoch": 0.049871166154101906, "percentage": 2.49, "elapsed_time": "1:32:51", "remaining_time": "2 days, 12:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 30076, "loss": 1.1177, "learning_rate": 2.6595744680851064e-05, "epoch": 0.053195910564375365, "percentage": 2.66, "elapsed_time": "1:39:26", "remaining_time": "2 days, 12:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 30076, "loss": 1.1117, "learning_rate": 2.8257978723404256e-05, "epoch": 0.056520654974648823, "percentage": 2.83, "elapsed_time": "1:45:26", "remaining_time": "2 days, 12:25:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 30076, "loss": 1.0738, "learning_rate": 2.9920212765957452e-05, "epoch": 0.05984539938492228, "percentage": 2.99, "elapsed_time": "1:52:01", "remaining_time": "2 days, 12:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 30076, "loss": 0.9417, "learning_rate": 3.158244680851064e-05, "epoch": 0.06317014379519574, "percentage": 3.16, "elapsed_time": "1:58:22", "remaining_time": "2 days, 12:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 30076, "loss": 0.9209, "learning_rate": 3.324468085106383e-05, "epoch": 0.0664948882054692, "percentage": 3.32, "elapsed_time": "2:04:33", "remaining_time": "2 days, 12:21:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 30076, "loss": 0.923, "learning_rate": 3.490691489361702e-05, "epoch": 0.06981963261574267, "percentage": 3.49, "elapsed_time": "2:10:58", "remaining_time": "2 days, 12:20:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 30076, "loss": 0.8675, "learning_rate": 3.6569148936170215e-05, "epoch": 0.07314437702601613, "percentage": 3.66, "elapsed_time": "2:17:27", "remaining_time": "2 days, 12:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 30076, "loss": 0.8474, "learning_rate": 3.823138297872341e-05, "epoch": 0.07646912143628959, "percentage": 3.82, "elapsed_time": "2:23:49", "remaining_time": "2 days, 12:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 30076, "loss": 0.9049, "learning_rate": 3.9893617021276594e-05, "epoch": 0.07979386584656305, "percentage": 3.99, "elapsed_time": "2:29:53", "remaining_time": "2 days, 12:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 30076, "loss": 0.8135, "learning_rate": 4.1555851063829786e-05, "epoch": 0.0831186102568365, "percentage": 4.16, "elapsed_time": "2:36:12", "remaining_time": "2 days, 12:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 30076, "loss": 0.8804, "learning_rate": 4.3218085106382986e-05, "epoch": 0.08644335466710996, "percentage": 4.32, "elapsed_time": "2:42:56", "remaining_time": "2 days, 12:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 30076, "loss": 0.8195, "learning_rate": 4.488031914893617e-05, "epoch": 0.08976809907738342, "percentage": 4.49, "elapsed_time": "2:48:51", "remaining_time": "2 days, 11:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 30076, "loss": 0.7564, "learning_rate": 4.6542553191489364e-05, "epoch": 0.09309284348765688, "percentage": 4.65, "elapsed_time": "2:54:50", "remaining_time": "2 days, 11:41:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1450, "total_steps": 30076, "loss": 0.8551, "learning_rate": 4.8204787234042556e-05, "epoch": 0.09641758789793034, "percentage": 4.82, "elapsed_time": "3:01:13", "remaining_time": "2 days, 11:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 30076, "loss": 0.7798, "learning_rate": 4.986702127659575e-05, "epoch": 0.09974233230820381, "percentage": 4.99, "elapsed_time": "3:07:46", "remaining_time": "2 days, 11:37:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1550, "total_steps": 30076, "loss": 0.7384, "learning_rate": 5.152925531914894e-05, "epoch": 0.10306707671847727, "percentage": 5.15, "elapsed_time": "3:13:41", "remaining_time": "2 days, 11:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1600, "total_steps": 30076, "loss": 0.792, "learning_rate": 5.319148936170213e-05, "epoch": 0.10639182112875073, "percentage": 5.32, "elapsed_time": "3:20:04", "remaining_time": "2 days, 11:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1650, "total_steps": 30076, "loss": 0.7462, "learning_rate": 5.485372340425532e-05, "epoch": 0.10971656553902419, "percentage": 5.49, "elapsed_time": "3:26:26", "remaining_time": "2 days, 11:16:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1700, "total_steps": 30076, "loss": 0.7477, "learning_rate": 5.651595744680851e-05, "epoch": 0.11304130994929765, "percentage": 5.65, "elapsed_time": "3:32:30", "remaining_time": "2 days, 11:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1750, "total_steps": 30076, "loss": 0.6861, "learning_rate": 5.81781914893617e-05, "epoch": 0.1163660543595711, "percentage": 5.82, "elapsed_time": "3:38:12", "remaining_time": "2 days, 10:52:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1800, "total_steps": 30076, "loss": 0.7214, "learning_rate": 5.9840425531914904e-05, "epoch": 0.11969079876984456, "percentage": 5.98, "elapsed_time": "3:44:29", "remaining_time": "2 days, 10:46:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1850, "total_steps": 30076, "loss": 0.6917, "learning_rate": 6.150265957446809e-05, "epoch": 0.12301554318011802, "percentage": 6.15, "elapsed_time": "3:50:54", "remaining_time": "2 days, 10:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1900, "total_steps": 30076, "loss": 0.6948, "learning_rate": 6.316489361702128e-05, "epoch": 0.12634028759039148, "percentage": 6.32, "elapsed_time": "3:57:06", "remaining_time": "2 days, 10:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1950, "total_steps": 30076, "loss": 0.7296, "learning_rate": 6.482712765957447e-05, "epoch": 0.12966503200066495, "percentage": 6.48, "elapsed_time": "4:02:57", "remaining_time": "2 days, 10:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2000, "total_steps": 30076, "loss": 0.732, "learning_rate": 6.648936170212766e-05, "epoch": 0.1329897764109384, "percentage": 6.65, "elapsed_time": "4:09:00", "remaining_time": "2 days, 10:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2050, "total_steps": 30076, "loss": 0.6978, "learning_rate": 6.815159574468085e-05, "epoch": 0.13631452082121187, "percentage": 6.82, "elapsed_time": "4:15:11", "remaining_time": "2 days, 10:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2100, "total_steps": 30076, "loss": 0.7093, "learning_rate": 6.981382978723405e-05, "epoch": 0.13963926523148534, "percentage": 6.98, "elapsed_time": "4:21:29", "remaining_time": "2 days, 10:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2150, "total_steps": 30076, "loss": 0.7114, "learning_rate": 7.147606382978723e-05, "epoch": 0.1429640096417588, "percentage": 7.15, "elapsed_time": "4:27:08", "remaining_time": "2 days, 9:49:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2200, "total_steps": 30076, "loss": 0.7156, "learning_rate": 7.313829787234043e-05, "epoch": 0.14628875405203226, "percentage": 7.31, "elapsed_time": "4:33:24", "remaining_time": "2 days, 9:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2250, "total_steps": 30076, "loss": 0.6908, "learning_rate": 7.480053191489363e-05, "epoch": 0.1496134984623057, "percentage": 7.48, "elapsed_time": "4:39:34", "remaining_time": "2 days, 9:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2300, "total_steps": 30076, "loss": 0.7239, "learning_rate": 7.646276595744682e-05, "epoch": 0.15293824287257918, "percentage": 7.65, "elapsed_time": "4:45:28", "remaining_time": "2 days, 9:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2350, "total_steps": 30076, "loss": 0.7164, "learning_rate": 7.8125e-05, "epoch": 0.15626298728285262, "percentage": 7.81, "elapsed_time": "4:51:49", "remaining_time": "2 days, 9:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2400, "total_steps": 30076, "loss": 0.7372, "learning_rate": 7.978723404255319e-05, "epoch": 0.1595877316931261, "percentage": 7.98, "elapsed_time": "4:58:10", "remaining_time": "2 days, 9:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2450, "total_steps": 30076, "loss": 0.6838, "learning_rate": 8.144946808510639e-05, "epoch": 0.16291247610339954, "percentage": 8.15, "elapsed_time": "5:04:47", "remaining_time": "2 days, 9:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2500, "total_steps": 30076, "loss": 0.6905, "learning_rate": 8.311170212765957e-05, "epoch": 0.166237220513673, "percentage": 8.31, "elapsed_time": "5:11:04", "remaining_time": "2 days, 9:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2550, "total_steps": 30076, "loss": 0.6824, "learning_rate": 8.477393617021277e-05, "epoch": 0.16956196492394648, "percentage": 8.48, "elapsed_time": "5:17:24", "remaining_time": "2 days, 9:06:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2600, "total_steps": 30076, "loss": 0.6813, "learning_rate": 8.643617021276597e-05, "epoch": 0.17288670933421993, "percentage": 8.64, "elapsed_time": "5:23:32", "remaining_time": "2 days, 8:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2650, "total_steps": 30076, "loss": 0.6849, "learning_rate": 8.809840425531916e-05, "epoch": 0.1762114537444934, "percentage": 8.81, "elapsed_time": "5:29:08", "remaining_time": "2 days, 8:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2700, "total_steps": 30076, "loss": 0.6488, "learning_rate": 8.976063829787234e-05, "epoch": 0.17953619815476685, "percentage": 8.98, "elapsed_time": "5:35:22", "remaining_time": "2 days, 8:40:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2750, "total_steps": 30076, "loss": 0.6468, "learning_rate": 9.142287234042554e-05, "epoch": 0.18286094256504032, "percentage": 9.14, "elapsed_time": "5:41:44", "remaining_time": "2 days, 8:35:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2800, "total_steps": 30076, "loss": 0.6661, "learning_rate": 9.308510638297873e-05, "epoch": 0.18618568697531376, "percentage": 9.31, "elapsed_time": "5:47:53", "remaining_time": "2 days, 8:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2850, "total_steps": 30076, "loss": 0.6519, "learning_rate": 9.474734042553191e-05, "epoch": 0.18951043138558724, "percentage": 9.48, "elapsed_time": "5:53:30", "remaining_time": "2 days, 8:17:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2900, "total_steps": 30076, "loss": 0.6852, "learning_rate": 9.640957446808511e-05, "epoch": 0.19283517579586068, "percentage": 9.64, "elapsed_time": "6:00:26", "remaining_time": "2 days, 8:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2950, "total_steps": 30076, "loss": 0.6286, "learning_rate": 9.807180851063831e-05, "epoch": 0.19615992020613415, "percentage": 9.81, "elapsed_time": "6:06:34", "remaining_time": "2 days, 8:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3000, "total_steps": 30076, "loss": 0.7135, "learning_rate": 9.97340425531915e-05, "epoch": 0.19948466461640763, "percentage": 9.97, "elapsed_time": "6:12:50", "remaining_time": "2 days, 8:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3050, "total_steps": 30076, "loss": 0.6312, "learning_rate": 9.999940594707412e-05, "epoch": 0.20280940902668107, "percentage": 10.14, "elapsed_time": "6:18:44", "remaining_time": "2 days, 7:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3100, "total_steps": 30076, "loss": 0.651, "learning_rate": 9.999714964504067e-05, "epoch": 0.20613415343695454, "percentage": 10.31, "elapsed_time": "6:25:04", "remaining_time": "2 days, 7:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3150, "total_steps": 30076, "loss": 0.6373, "learning_rate": 9.999320961690213e-05, "epoch": 0.209458897847228, "percentage": 10.47, "elapsed_time": "6:31:21", "remaining_time": "2 days, 7:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3200, "total_steps": 30076, "loss": 0.7085, "learning_rate": 9.998758599534463e-05, "epoch": 0.21278364225750146, "percentage": 10.64, "elapsed_time": "6:37:22", "remaining_time": "2 days, 7:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3250, "total_steps": 30076, "loss": 0.684, "learning_rate": 9.998027896975173e-05, "epoch": 0.2161083866677749, "percentage": 10.81, "elapsed_time": "6:43:47", "remaining_time": "2 days, 7:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3300, "total_steps": 30076, "loss": 0.6139, "learning_rate": 9.997128878619808e-05, "epoch": 0.21943313107804838, "percentage": 10.97, "elapsed_time": "6:49:34", "remaining_time": "2 days, 7:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3350, "total_steps": 30076, "loss": 0.6458, "learning_rate": 9.996061574744102e-05, "epoch": 0.22275787548832182, "percentage": 11.14, "elapsed_time": "6:55:54", "remaining_time": "2 days, 7:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3400, "total_steps": 30076, "loss": 0.6125, "learning_rate": 9.994826021291056e-05, "epoch": 0.2260826198985953, "percentage": 11.3, "elapsed_time": "7:02:17", "remaining_time": "2 days, 7:13:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3450, "total_steps": 30076, "loss": 0.6086, "learning_rate": 9.993422259869713e-05, "epoch": 0.22940736430886877, "percentage": 11.47, "elapsed_time": "7:08:09", "remaining_time": "2 days, 7:04:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3500, "total_steps": 30076, "loss": 0.6516, "learning_rate": 9.991850337753762e-05, "epoch": 0.2327321087191422, "percentage": 11.64, "elapsed_time": "7:14:16", "remaining_time": "2 days, 6:57:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3550, "total_steps": 30076, "loss": 0.5939, "learning_rate": 9.990110307879952e-05, "epoch": 0.23605685312941568, "percentage": 11.8, "elapsed_time": "7:20:35", "remaining_time": "2 days, 6:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3600, "total_steps": 30076, "loss": 0.5968, "learning_rate": 9.988202228846291e-05, "epoch": 0.23938159753968913, "percentage": 11.97, "elapsed_time": "7:26:41", "remaining_time": "2 days, 6:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3650, "total_steps": 30076, "loss": 0.6498, "learning_rate": 9.986126164910094e-05, "epoch": 0.2427063419499626, "percentage": 12.14, "elapsed_time": "7:32:54", "remaining_time": "2 days, 6:39:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3700, "total_steps": 30076, "loss": 0.6477, "learning_rate": 9.983882185985808e-05, "epoch": 0.24603108636023605, "percentage": 12.3, "elapsed_time": "7:38:51", "remaining_time": "2 days, 6:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3750, "total_steps": 30076, "loss": 0.6328, "learning_rate": 9.98147036764266e-05, "epoch": 0.24935583077050952, "percentage": 12.47, "elapsed_time": "7:44:52", "remaining_time": "2 days, 6:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3800, "total_steps": 30076, "loss": 0.649, "learning_rate": 9.978890791102109e-05, "epoch": 0.25268057518078296, "percentage": 12.63, "elapsed_time": "7:50:34", "remaining_time": "2 days, 6:13:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3850, "total_steps": 30076, "loss": 0.6618, "learning_rate": 9.976143543235114e-05, "epoch": 0.25600531959105643, "percentage": 12.8, "elapsed_time": "7:57:05", "remaining_time": "2 days, 6:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3900, "total_steps": 30076, "loss": 0.6205, "learning_rate": 9.973228716559209e-05, "epoch": 0.2593300640013299, "percentage": 12.97, "elapsed_time": "8:03:51", "remaining_time": "2 days, 6:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3950, "total_steps": 30076, "loss": 0.5935, "learning_rate": 9.970146409235386e-05, "epoch": 0.2626548084116034, "percentage": 13.13, "elapsed_time": "8:09:49", "remaining_time": "2 days, 5:59:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4000, "total_steps": 30076, "loss": 0.596, "learning_rate": 9.966896725064786e-05, "epoch": 0.2659795528218768, "percentage": 13.3, "elapsed_time": "8:15:44", "remaining_time": "2 days, 5:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4050, "total_steps": 30076, "loss": 0.6313, "learning_rate": 9.963479773485211e-05, "epoch": 0.26930429723215027, "percentage": 13.47, "elapsed_time": "8:22:02", "remaining_time": "2 days, 5:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4100, "total_steps": 30076, "loss": 0.6126, "learning_rate": 9.959895669567435e-05, "epoch": 0.27262904164242374, "percentage": 13.63, "elapsed_time": "8:28:45", "remaining_time": "2 days, 5:43:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4150, "total_steps": 30076, "loss": 0.6132, "learning_rate": 9.956144534011318e-05, "epoch": 0.2759537860526972, "percentage": 13.8, "elapsed_time": "8:35:19", "remaining_time": "2 days, 5:39:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4200, "total_steps": 30076, "loss": 0.6075, "learning_rate": 9.952226493141765e-05, "epoch": 0.2792785304629707, "percentage": 13.96, "elapsed_time": "8:41:21", "remaining_time": "2 days, 5:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4250, "total_steps": 30076, "loss": 0.5422, "learning_rate": 9.94814167890445e-05, "epoch": 0.2826032748732441, "percentage": 14.13, "elapsed_time": "8:47:41", "remaining_time": "2 days, 5:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4300, "total_steps": 30076, "loss": 0.573, "learning_rate": 9.943890228861383e-05, "epoch": 0.2859280192835176, "percentage": 14.3, "elapsed_time": "8:54:00", "remaining_time": "2 days, 5:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4350, "total_steps": 30076, "loss": 0.6314, "learning_rate": 9.939472286186271e-05, "epoch": 0.28925276369379105, "percentage": 14.46, "elapsed_time": "9:00:27", "remaining_time": "2 days, 5:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4400, "total_steps": 30076, "loss": 0.5865, "learning_rate": 9.934887999659707e-05, "epoch": 0.2925775081040645, "percentage": 14.63, "elapsed_time": "9:06:45", "remaining_time": "2 days, 5:10:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4450, "total_steps": 30076, "loss": 0.5994, "learning_rate": 9.930137523664149e-05, "epoch": 0.29590225251433794, "percentage": 14.8, "elapsed_time": "9:13:05", "remaining_time": "2 days, 5:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4500, "total_steps": 30076, "loss": 0.6174, "learning_rate": 9.925221018178728e-05, "epoch": 0.2992269969246114, "percentage": 14.96, "elapsed_time": "9:19:17", "remaining_time": "2 days, 4:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4550, "total_steps": 30076, "loss": 0.5778, "learning_rate": 9.920138648773852e-05, "epoch": 0.3025517413348849, "percentage": 15.13, "elapsed_time": "9:25:20", "remaining_time": "2 days, 4:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4600, "total_steps": 30076, "loss": 0.5745, "learning_rate": 9.914890586605638e-05, "epoch": 0.30587648574515836, "percentage": 15.29, "elapsed_time": "9:31:18", "remaining_time": "2 days, 4:44:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4650, "total_steps": 30076, "loss": 0.6356, "learning_rate": 9.90947700841015e-05, "epoch": 0.3092012301554318, "percentage": 15.46, "elapsed_time": "9:37:24", "remaining_time": "2 days, 4:37:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4700, "total_steps": 30076, "loss": 0.6593, "learning_rate": 9.903898096497441e-05, "epoch": 0.31252597456570524, "percentage": 15.63, "elapsed_time": "9:43:44", "remaining_time": "2 days, 4:31:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4750, "total_steps": 30076, "loss": 0.637, "learning_rate": 9.898154038745408e-05, "epoch": 0.3158507189759787, "percentage": 15.79, "elapsed_time": "9:50:02", "remaining_time": "2 days, 4:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4800, "total_steps": 30076, "loss": 0.6007, "learning_rate": 9.892245028593483e-05, "epoch": 0.3191754633862522, "percentage": 15.96, "elapsed_time": "9:56:19", "remaining_time": "2 days, 4:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4850, "total_steps": 30076, "loss": 0.5526, "learning_rate": 9.886171265036102e-05, "epoch": 0.32250020779652566, "percentage": 16.13, "elapsed_time": "10:02:24", "remaining_time": "2 days, 4:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4900, "total_steps": 30076, "loss": 0.5863, "learning_rate": 9.879932952616009e-05, "epoch": 0.3258249522067991, "percentage": 16.29, "elapsed_time": "10:08:39", "remaining_time": "2 days, 4:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4950, "total_steps": 30076, "loss": 0.579, "learning_rate": 9.873530301417373e-05, "epoch": 0.32914969661707255, "percentage": 16.46, "elapsed_time": "10:14:45", "remaining_time": "2 days, 4:00:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5000, "total_steps": 30076, "loss": 0.6135, "learning_rate": 9.8669635270587e-05, "epoch": 0.332474441027346, "percentage": 16.62, "elapsed_time": "10:21:23", "remaining_time": "2 days, 3:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5050, "total_steps": 30076, "loss": 0.5849, "learning_rate": 9.860232850685589e-05, "epoch": 0.3357991854376195, "percentage": 16.79, "elapsed_time": "10:27:42", "remaining_time": "2 days, 3:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5100, "total_steps": 30076, "loss": 0.591, "learning_rate": 9.853338498963272e-05, "epoch": 0.33912392984789297, "percentage": 16.96, "elapsed_time": "10:34:03", "remaining_time": "2 days, 3:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5150, "total_steps": 30076, "loss": 0.6121, "learning_rate": 9.846280704068982e-05, "epoch": 0.3424486742581664, "percentage": 17.12, "elapsed_time": "10:40:11", "remaining_time": "2 days, 3:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5200, "total_steps": 30076, "loss": 0.5705, "learning_rate": 9.839059703684139e-05, "epoch": 0.34577341866843986, "percentage": 17.29, "elapsed_time": "10:46:38", "remaining_time": "2 days, 3:33:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5250, "total_steps": 30076, "loss": 0.633, "learning_rate": 9.831675740986346e-05, "epoch": 0.34909816307871333, "percentage": 17.46, "elapsed_time": "10:53:01", "remaining_time": "2 days, 3:28:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5300, "total_steps": 30076, "loss": 0.5706, "learning_rate": 9.82412906464119e-05, "epoch": 0.3524229074889868, "percentage": 17.62, "elapsed_time": "10:59:14", "remaining_time": "2 days, 3:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5350, "total_steps": 30076, "loss": 0.5357, "learning_rate": 9.816419928793879e-05, "epoch": 0.3557476518992602, "percentage": 17.79, "elapsed_time": "11:05:43", "remaining_time": "2 days, 3:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5400, "total_steps": 30076, "loss": 0.6065, "learning_rate": 9.808548593060681e-05, "epoch": 0.3590723963095337, "percentage": 17.95, "elapsed_time": "11:11:47", "remaining_time": "2 days, 3:09:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5450, "total_steps": 30076, "loss": 0.5832, "learning_rate": 9.800515322520174e-05, "epoch": 0.36239714071980716, "percentage": 18.12, "elapsed_time": "11:17:48", "remaining_time": "2 days, 3:02:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5500, "total_steps": 30076, "loss": 0.5808, "learning_rate": 9.792320387704328e-05, "epoch": 0.36572188513008064, "percentage": 18.29, "elapsed_time": "11:23:47", "remaining_time": "2 days, 2:55:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5550, "total_steps": 30076, "loss": 0.6015, "learning_rate": 9.783964064589387e-05, "epoch": 0.3690466295403541, "percentage": 18.45, "elapsed_time": "11:30:21", "remaining_time": "2 days, 2:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5600, "total_steps": 30076, "loss": 0.6086, "learning_rate": 9.775446634586584e-05, "epoch": 0.3723713739506275, "percentage": 18.62, "elapsed_time": "11:36:37", "remaining_time": "2 days, 2:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5650, "total_steps": 30076, "loss": 0.5674, "learning_rate": 9.766768384532654e-05, "epoch": 0.375696118360901, "percentage": 18.79, "elapsed_time": "11:42:29", "remaining_time": "2 days, 2:36:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5700, "total_steps": 30076, "loss": 0.5112, "learning_rate": 9.757929606680181e-05, "epoch": 0.37902086277117447, "percentage": 18.95, "elapsed_time": "11:48:36", "remaining_time": "2 days, 2:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5750, "total_steps": 30076, "loss": 0.6066, "learning_rate": 9.748930598687752e-05, "epoch": 0.38234560718144794, "percentage": 19.12, "elapsed_time": "11:54:35", "remaining_time": "2 days, 2:23:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5800, "total_steps": 30076, "loss": 0.5997, "learning_rate": 9.73977166360994e-05, "epoch": 0.38567035159172136, "percentage": 19.28, "elapsed_time": "12:00:58", "remaining_time": "2 days, 2:17:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5850, "total_steps": 30076, "loss": 0.5986, "learning_rate": 9.730453109887087e-05, "epoch": 0.38899509600199483, "percentage": 19.45, "elapsed_time": "12:06:54", "remaining_time": "2 days, 2:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5900, "total_steps": 30076, "loss": 0.5235, "learning_rate": 9.720975251334929e-05, "epoch": 0.3923198404122683, "percentage": 19.62, "elapsed_time": "12:13:03", "remaining_time": "2 days, 2:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5950, "total_steps": 30076, "loss": 0.62, "learning_rate": 9.711338407134016e-05, "epoch": 0.3956445848225418, "percentage": 19.78, "elapsed_time": "12:19:31", "remaining_time": "2 days, 1:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6000, "total_steps": 30076, "loss": 0.583, "learning_rate": 9.701542901818974e-05, "epoch": 0.39896932923281525, "percentage": 19.95, "elapsed_time": "12:25:50", "remaining_time": "2 days, 1:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6050, "total_steps": 30076, "loss": 0.5456, "learning_rate": 9.691589065267568e-05, "epoch": 0.40229407364308867, "percentage": 20.12, "elapsed_time": "12:31:57", "remaining_time": "2 days, 1:46:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6100, "total_steps": 30076, "loss": 0.5725, "learning_rate": 9.681477232689596e-05, "epoch": 0.40561881805336214, "percentage": 20.28, "elapsed_time": "12:38:25", "remaining_time": "2 days, 1:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6150, "total_steps": 30076, "loss": 0.6161, "learning_rate": 9.671207744615598e-05, "epoch": 0.4089435624636356, "percentage": 20.45, "elapsed_time": "12:44:55", "remaining_time": "2 days, 1:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6200, "total_steps": 30076, "loss": 0.5519, "learning_rate": 9.660780946885397e-05, "epoch": 0.4122683068739091, "percentage": 20.61, "elapsed_time": "12:51:10", "remaining_time": "2 days, 1:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6250, "total_steps": 30076, "loss": 0.6336, "learning_rate": 9.650197190636438e-05, "epoch": 0.4155930512841825, "percentage": 20.78, "elapsed_time": "12:57:29", "remaining_time": "2 days, 1:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6300, "total_steps": 30076, "loss": 0.5666, "learning_rate": 9.639456832291974e-05, "epoch": 0.418917795694456, "percentage": 20.95, "elapsed_time": "13:03:35", "remaining_time": "2 days, 1:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6350, "total_steps": 30076, "loss": 0.55, "learning_rate": 9.628560233549058e-05, "epoch": 0.42224254010472945, "percentage": 21.11, "elapsed_time": "13:10:05", "remaining_time": "2 days, 1:12:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6400, "total_steps": 30076, "loss": 0.5756, "learning_rate": 9.617507761366367e-05, "epoch": 0.4255672845150029, "percentage": 21.28, "elapsed_time": "13:16:15", "remaining_time": "2 days, 1:05:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6450, "total_steps": 30076, "loss": 0.6014, "learning_rate": 9.606299787951836e-05, "epoch": 0.4288920289252764, "percentage": 21.45, "elapsed_time": "13:22:52", "remaining_time": "2 days, 1:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6500, "total_steps": 30076, "loss": 0.5764, "learning_rate": 9.594936690750129e-05, "epoch": 0.4322167733355498, "percentage": 21.61, "elapsed_time": "13:28:48", "remaining_time": "2 days, 0:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6550, "total_steps": 30076, "loss": 0.5548, "learning_rate": 9.583418852429933e-05, "epoch": 0.4355415177458233, "percentage": 21.78, "elapsed_time": "13:35:02", "remaining_time": "2 days, 0:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6600, "total_steps": 30076, "loss": 0.5769, "learning_rate": 9.571746660871058e-05, "epoch": 0.43886626215609675, "percentage": 21.94, "elapsed_time": "13:41:29", "remaining_time": "2 days, 0:42:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6650, "total_steps": 30076, "loss": 0.562, "learning_rate": 9.559920509151386e-05, "epoch": 0.4421910065663702, "percentage": 22.11, "elapsed_time": "13:47:48", "remaining_time": "2 days, 0:36:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6700, "total_steps": 30076, "loss": 0.5478, "learning_rate": 9.547940795533627e-05, "epoch": 0.44551575097664364, "percentage": 22.28, "elapsed_time": "13:54:12", "remaining_time": "2 days, 0:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6750, "total_steps": 30076, "loss": 0.5292, "learning_rate": 9.535807923451911e-05, "epoch": 0.4488404953869171, "percentage": 22.44, "elapsed_time": "14:00:07", "remaining_time": "2 days, 0:23:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6800, "total_steps": 30076, "loss": 0.608, "learning_rate": 9.523522301498202e-05, "epoch": 0.4521652397971906, "percentage": 22.61, "elapsed_time": "14:06:26", "remaining_time": "2 days, 0:17:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6850, "total_steps": 30076, "loss": 0.5555, "learning_rate": 9.511084343408531e-05, "epoch": 0.45548998420746406, "percentage": 22.78, "elapsed_time": "14:12:35", "remaining_time": "2 days, 0:10:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6900, "total_steps": 30076, "loss": 0.5309, "learning_rate": 9.498494468049072e-05, "epoch": 0.45881472861773753, "percentage": 22.94, "elapsed_time": "14:18:27", "remaining_time": "2 days, 0:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6950, "total_steps": 30076, "loss": 0.5725, "learning_rate": 9.485753099402031e-05, "epoch": 0.46213947302801095, "percentage": 23.11, "elapsed_time": "14:24:44", "remaining_time": "1 day, 23:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7000, "total_steps": 30076, "loss": 0.544, "learning_rate": 9.472860666551369e-05, "epoch": 0.4654642174382844, "percentage": 23.27, "elapsed_time": "14:30:55", "remaining_time": "1 day, 23:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7050, "total_steps": 30076, "loss": 0.5701, "learning_rate": 9.459817603668351e-05, "epoch": 0.4687889618485579, "percentage": 23.44, "elapsed_time": "14:36:57", "remaining_time": "1 day, 23:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7100, "total_steps": 30076, "loss": 0.5523, "learning_rate": 9.446624349996929e-05, "epoch": 0.47211370625883137, "percentage": 23.61, "elapsed_time": "14:42:47", "remaining_time": "1 day, 23:36:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7150, "total_steps": 30076, "loss": 0.5224, "learning_rate": 9.433281349838941e-05, "epoch": 0.47543845066910484, "percentage": 23.77, "elapsed_time": "14:48:49", "remaining_time": "1 day, 23:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7200, "total_steps": 30076, "loss": 0.5807, "learning_rate": 9.419789052539157e-05, "epoch": 0.47876319507937826, "percentage": 23.94, "elapsed_time": "14:55:01", "remaining_time": "1 day, 23:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7250, "total_steps": 30076, "loss": 0.5496, "learning_rate": 9.406147912470143e-05, "epoch": 0.48208793948965173, "percentage": 24.11, "elapsed_time": "15:01:31", "remaining_time": "1 day, 23:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7300, "total_steps": 30076, "loss": 0.5681, "learning_rate": 9.392358389016961e-05, "epoch": 0.4854126838999252, "percentage": 24.27, "elapsed_time": "15:07:48", "remaining_time": "1 day, 23:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7350, "total_steps": 30076, "loss": 0.5595, "learning_rate": 9.378420946561697e-05, "epoch": 0.4887374283101987, "percentage": 24.44, "elapsed_time": "15:14:15", "remaining_time": "1 day, 23:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7400, "total_steps": 30076, "loss": 0.5436, "learning_rate": 9.364336054467819e-05, "epoch": 0.4920621727204721, "percentage": 24.6, "elapsed_time": "15:20:42", "remaining_time": "1 day, 23:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7450, "total_steps": 30076, "loss": 0.5452, "learning_rate": 9.350104187064379e-05, "epoch": 0.49538691713074556, "percentage": 24.77, "elapsed_time": "15:27:28", "remaining_time": "1 day, 22:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7500, "total_steps": 30076, "loss": 0.5603, "learning_rate": 9.335725823630035e-05, "epoch": 0.49871166154101904, "percentage": 24.94, "elapsed_time": "15:33:34", "remaining_time": "1 day, 22:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7550, "total_steps": 30076, "loss": 0.517, "learning_rate": 9.321201448376904e-05, "epoch": 0.5020364059512925, "percentage": 25.1, "elapsed_time": "15:39:31", "remaining_time": "1 day, 22:43:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7600, "total_steps": 30076, "loss": 0.5428, "learning_rate": 9.306531550434268e-05, "epoch": 0.5053611503615659, "percentage": 25.27, "elapsed_time": "15:45:49", "remaining_time": "1 day, 22:37:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7650, "total_steps": 30076, "loss": 0.5486, "learning_rate": 9.291716623832091e-05, "epoch": 0.5086858947718395, "percentage": 25.44, "elapsed_time": "15:52:35", "remaining_time": "1 day, 22:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7700, "total_steps": 30076, "loss": 0.5383, "learning_rate": 9.276757167484389e-05, "epoch": 0.5120106391821129, "percentage": 25.6, "elapsed_time": "15:58:52", "remaining_time": "1 day, 22:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7750, "total_steps": 30076, "loss": 0.6017, "learning_rate": 9.261653685172422e-05, "epoch": 0.5153353835923863, "percentage": 25.77, "elapsed_time": "16:04:57", "remaining_time": "1 day, 22:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7800, "total_steps": 30076, "loss": 0.5711, "learning_rate": 9.246406685527739e-05, "epoch": 0.5186601280026598, "percentage": 25.93, "elapsed_time": "16:11:04", "remaining_time": "1 day, 22:13:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7850, "total_steps": 30076, "loss": 0.5859, "learning_rate": 9.231016682015035e-05, "epoch": 0.5219848724129332, "percentage": 26.1, "elapsed_time": "16:17:09", "remaining_time": "1 day, 22:06:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7900, "total_steps": 30076, "loss": 0.5151, "learning_rate": 9.21548419291487e-05, "epoch": 0.5253096168232068, "percentage": 26.27, "elapsed_time": "16:23:06", "remaining_time": "1 day, 21:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7950, "total_steps": 30076, "loss": 0.5288, "learning_rate": 9.19980974130621e-05, "epoch": 0.5286343612334802, "percentage": 26.43, "elapsed_time": "16:29:06", "remaining_time": "1 day, 21:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8000, "total_steps": 30076, "loss": 0.554, "learning_rate": 9.183993855048811e-05, "epoch": 0.5319591056437536, "percentage": 26.6, "elapsed_time": "16:35:06", "remaining_time": "1 day, 21:46:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8050, "total_steps": 30076, "loss": 0.5566, "learning_rate": 9.168037066765453e-05, "epoch": 0.5352838500540271, "percentage": 26.77, "elapsed_time": "16:41:16", "remaining_time": "1 day, 21:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8100, "total_steps": 30076, "loss": 0.5464, "learning_rate": 9.151939913823988e-05, "epoch": 0.5386085944643005, "percentage": 26.93, "elapsed_time": "16:47:53", "remaining_time": "1 day, 21:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8150, "total_steps": 30076, "loss": 0.5381, "learning_rate": 9.135702938319251e-05, "epoch": 0.5419333388745741, "percentage": 27.1, "elapsed_time": "16:54:22", "remaining_time": "1 day, 21:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8200, "total_steps": 30076, "loss": 0.528, "learning_rate": 9.119326687054802e-05, "epoch": 0.5452580832848475, "percentage": 27.26, "elapsed_time": "17:00:13", "remaining_time": "1 day, 21:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8250, "total_steps": 30076, "loss": 0.5613, "learning_rate": 9.102811711524519e-05, "epoch": 0.5485828276951209, "percentage": 27.43, "elapsed_time": "17:06:15", "remaining_time": "1 day, 21:15:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8300, "total_steps": 30076, "loss": 0.5576, "learning_rate": 9.086158567894013e-05, "epoch": 0.5519075721053944, "percentage": 27.6, "elapsed_time": "17:12:41", "remaining_time": "1 day, 21:09:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8350, "total_steps": 30076, "loss": 0.54, "learning_rate": 9.069367816981911e-05, "epoch": 0.5552323165156678, "percentage": 27.76, "elapsed_time": "17:18:42", "remaining_time": "1 day, 21:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8400, "total_steps": 30076, "loss": 0.4902, "learning_rate": 9.052440024240956e-05, "epoch": 0.5585570609259414, "percentage": 27.93, "elapsed_time": "17:24:46", "remaining_time": "1 day, 20:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8450, "total_steps": 30076, "loss": 0.509, "learning_rate": 9.03537575973898e-05, "epoch": 0.5618818053362148, "percentage": 28.1, "elapsed_time": "17:30:29", "remaining_time": "1 day, 20:48:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8500, "total_steps": 30076, "loss": 0.5154, "learning_rate": 9.018175598139696e-05, "epoch": 0.5652065497464882, "percentage": 28.26, "elapsed_time": "17:36:45", "remaining_time": "1 day, 20:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8550, "total_steps": 30076, "loss": 0.535, "learning_rate": 9.000840118683344e-05, "epoch": 0.5685312941567617, "percentage": 28.43, "elapsed_time": "17:42:57", "remaining_time": "1 day, 20:36:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8600, "total_steps": 30076, "loss": 0.4827, "learning_rate": 8.983369905167191e-05, "epoch": 0.5718560385670352, "percentage": 28.59, "elapsed_time": "17:49:24", "remaining_time": "1 day, 20:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8650, "total_steps": 30076, "loss": 0.5161, "learning_rate": 8.965765545925869e-05, "epoch": 0.5751807829773086, "percentage": 28.76, "elapsed_time": "17:55:37", "remaining_time": "1 day, 20:24:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8700, "total_steps": 30076, "loss": 0.5239, "learning_rate": 8.948027633811557e-05, "epoch": 0.5785055273875821, "percentage": 28.93, "elapsed_time": "18:02:00", "remaining_time": "1 day, 20:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8750, "total_steps": 30076, "loss": 0.5577, "learning_rate": 8.930156766174025e-05, "epoch": 0.5818302717978555, "percentage": 29.09, "elapsed_time": "18:08:26", "remaining_time": "1 day, 20:12:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8800, "total_steps": 30076, "loss": 0.5693, "learning_rate": 8.912153544840507e-05, "epoch": 0.585155016208129, "percentage": 29.26, "elapsed_time": "18:14:32", "remaining_time": "1 day, 20:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8850, "total_steps": 30076, "loss": 0.4972, "learning_rate": 8.894018576095439e-05, "epoch": 0.5884797606184025, "percentage": 29.43, "elapsed_time": "18:20:34", "remaining_time": "1 day, 19:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8900, "total_steps": 30076, "loss": 0.5021, "learning_rate": 8.875752470660043e-05, "epoch": 0.5918045050286759, "percentage": 29.59, "elapsed_time": "18:27:02", "remaining_time": "1 day, 19:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8950, "total_steps": 30076, "loss": 0.5546, "learning_rate": 8.857355843671757e-05, "epoch": 0.5951292494389494, "percentage": 29.76, "elapsed_time": "18:33:54", "remaining_time": "1 day, 19:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9000, "total_steps": 30076, "loss": 0.5434, "learning_rate": 8.838829314663522e-05, "epoch": 0.5984539938492228, "percentage": 29.92, "elapsed_time": "18:40:14", "remaining_time": "1 day, 19:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9050, "total_steps": 30076, "loss": 0.5041, "learning_rate": 8.820173507542915e-05, "epoch": 0.6017787382594963, "percentage": 30.09, "elapsed_time": "18:46:25", "remaining_time": "1 day, 19:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9100, "total_steps": 30076, "loss": 0.5354, "learning_rate": 8.80138905057114e-05, "epoch": 0.6051034826697698, "percentage": 30.26, "elapsed_time": "18:52:51", "remaining_time": "1 day, 19:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9150, "total_steps": 30076, "loss": 0.5127, "learning_rate": 8.782476576341873e-05, "epoch": 0.6084282270800432, "percentage": 30.42, "elapsed_time": "18:58:53", "remaining_time": "1 day, 19:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9200, "total_steps": 30076, "loss": 0.4883, "learning_rate": 8.763436721759952e-05, "epoch": 0.6117529714903167, "percentage": 30.59, "elapsed_time": "19:04:39", "remaining_time": "1 day, 19:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9250, "total_steps": 30076, "loss": 0.4566, "learning_rate": 8.744270128019934e-05, "epoch": 0.6150777159005901, "percentage": 30.76, "elapsed_time": "19:10:58", "remaining_time": "1 day, 19:11:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9300, "total_steps": 30076, "loss": 0.5758, "learning_rate": 8.724977440584497e-05, "epoch": 0.6184024603108637, "percentage": 30.92, "elapsed_time": "19:16:48", "remaining_time": "1 day, 19:04:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9350, "total_steps": 30076, "loss": 0.5346, "learning_rate": 8.705559309162712e-05, "epoch": 0.6217272047211371, "percentage": 31.09, "elapsed_time": "19:23:16", "remaining_time": "1 day, 18:58:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9400, "total_steps": 30076, "loss": 0.5128, "learning_rate": 8.686016387688153e-05, "epoch": 0.6250519491314105, "percentage": 31.25, "elapsed_time": "19:29:37", "remaining_time": "1 day, 18:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9450, "total_steps": 30076, "loss": 0.4906, "learning_rate": 8.666349334296877e-05, "epoch": 0.628376693541684, "percentage": 31.42, "elapsed_time": "19:35:34", "remaining_time": "1 day, 18:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9500, "total_steps": 30076, "loss": 0.5378, "learning_rate": 8.646558811305268e-05, "epoch": 0.6317014379519574, "percentage": 31.59, "elapsed_time": "19:42:02", "remaining_time": "1 day, 18:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9550, "total_steps": 30076, "loss": 0.5361, "learning_rate": 8.626645485187722e-05, "epoch": 0.6350261823622309, "percentage": 31.75, "elapsed_time": "19:48:46", "remaining_time": "1 day, 18:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9600, "total_steps": 30076, "loss": 0.509, "learning_rate": 8.60661002655421e-05, "epoch": 0.6383509267725044, "percentage": 31.92, "elapsed_time": "19:55:01", "remaining_time": "1 day, 18:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9650, "total_steps": 30076, "loss": 0.536, "learning_rate": 8.586453110127688e-05, "epoch": 0.6416756711827778, "percentage": 32.09, "elapsed_time": "20:01:15", "remaining_time": "1 day, 18:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9700, "total_steps": 30076, "loss": 0.4913, "learning_rate": 8.566175414721384e-05, "epoch": 0.6450004155930513, "percentage": 32.25, "elapsed_time": "20:07:58", "remaining_time": "1 day, 18:17:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9750, "total_steps": 30076, "loss": 0.5193, "learning_rate": 8.545777623215927e-05, "epoch": 0.6483251600033247, "percentage": 32.42, "elapsed_time": "20:13:54", "remaining_time": "1 day, 18:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9800, "total_steps": 30076, "loss": 0.5351, "learning_rate": 8.525260422536358e-05, "epoch": 0.6516499044135982, "percentage": 32.58, "elapsed_time": "20:20:02", "remaining_time": "1 day, 18:04:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9850, "total_steps": 30076, "loss": 0.5594, "learning_rate": 8.504624503628995e-05, "epoch": 0.6549746488238717, "percentage": 32.75, "elapsed_time": "20:26:12", "remaining_time": "1 day, 17:57:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9900, "total_steps": 30076, "loss": 0.5219, "learning_rate": 8.483870561438161e-05, "epoch": 0.6582993932341451, "percentage": 32.92, "elapsed_time": "20:32:28", "remaining_time": "1 day, 17:51:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9950, "total_steps": 30076, "loss": 0.5606, "learning_rate": 8.462999294882783e-05, "epoch": 0.6616241376444186, "percentage": 33.08, "elapsed_time": "20:38:32", "remaining_time": "1 day, 17:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10000, "total_steps": 30076, "loss": 0.5011, "learning_rate": 8.442011406832859e-05, "epoch": 0.664948882054692, "percentage": 33.25, "elapsed_time": "20:44:37", "remaining_time": "1 day, 17:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10000, "total_steps": 30076, "eval_loss": 0.4348411560058594, "epoch": 0.664948882054692, "percentage": 33.25, "elapsed_time": "21:57:19", "remaining_time": "1 day, 20:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10050, "total_steps": 30076, "loss": 0.5451, "learning_rate": 8.420907604085781e-05, "epoch": 0.6682736264649655, "percentage": 33.42, "elapsed_time": "22:03:52", "remaining_time": "1 day, 19:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10100, "total_steps": 30076, "loss": 0.5388, "learning_rate": 8.399688597342535e-05, "epoch": 0.671598370875239, "percentage": 33.58, "elapsed_time": "22:10:11", "remaining_time": "1 day, 19:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10150, "total_steps": 30076, "loss": 0.5205, "learning_rate": 8.378355101183769e-05, "epoch": 0.6749231152855124, "percentage": 33.75, "elapsed_time": "22:16:41", "remaining_time": "1 day, 19:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10200, "total_steps": 30076, "loss": 0.5349, "learning_rate": 8.356907834045726e-05, "epoch": 0.6782478596957859, "percentage": 33.91, "elapsed_time": "22:22:38", "remaining_time": "1 day, 19:36:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10250, "total_steps": 30076, "loss": 0.4955, "learning_rate": 8.335347518196052e-05, "epoch": 0.6815726041060594, "percentage": 34.08, "elapsed_time": "22:29:06", "remaining_time": "1 day, 19:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10300, "total_steps": 30076, "loss": 0.5571, "learning_rate": 8.313674879709475e-05, "epoch": 0.6848973485163328, "percentage": 34.25, "elapsed_time": "22:35:39", "remaining_time": "1 day, 19:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10350, "total_steps": 30076, "loss": 0.5335, "learning_rate": 8.29189064844334e-05, "epoch": 0.6882220929266063, "percentage": 34.41, "elapsed_time": "22:41:50", "remaining_time": "1 day, 19:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10400, "total_steps": 30076, "loss": 0.5151, "learning_rate": 8.269995558013049e-05, "epoch": 0.6915468373368797, "percentage": 34.58, "elapsed_time": "22:47:26", "remaining_time": "1 day, 19:07:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10450, "total_steps": 30076, "loss": 0.4983, "learning_rate": 8.24799034576734e-05, "epoch": 0.6948715817471531, "percentage": 34.75, "elapsed_time": "22:53:19", "remaining_time": "1 day, 18:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10500, "total_steps": 30076, "loss": 0.5027, "learning_rate": 8.225875752763468e-05, "epoch": 0.6981963261574267, "percentage": 34.91, "elapsed_time": "22:59:39", "remaining_time": "1 day, 18:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10550, "total_steps": 30076, "loss": 0.4735, "learning_rate": 8.203652523742237e-05, "epoch": 0.7015210705677001, "percentage": 35.08, "elapsed_time": "23:06:10", "remaining_time": "1 day, 18:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10600, "total_steps": 30076, "loss": 0.4945, "learning_rate": 8.181321407102929e-05, "epoch": 0.7048458149779736, "percentage": 35.24, "elapsed_time": "23:12:15", "remaining_time": "1 day, 18:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10650, "total_steps": 30076, "loss": 0.5094, "learning_rate": 8.158883154878094e-05, "epoch": 0.708170559388247, "percentage": 35.41, "elapsed_time": "23:18:58", "remaining_time": "1 day, 18:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10700, "total_steps": 30076, "loss": 0.5064, "learning_rate": 8.136338522708233e-05, "epoch": 0.7114953037985204, "percentage": 35.58, "elapsed_time": "23:25:10", "remaining_time": "1 day, 18:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10750, "total_steps": 30076, "loss": 0.4934, "learning_rate": 8.11368826981634e-05, "epoch": 0.714820048208794, "percentage": 35.74, "elapsed_time": "23:31:41", "remaining_time": "1 day, 18:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10800, "total_steps": 30076, "loss": 0.5097, "learning_rate": 8.090933158982338e-05, "epoch": 0.7181447926190674, "percentage": 35.91, "elapsed_time": "23:37:49", "remaining_time": "1 day, 18:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10850, "total_steps": 30076, "loss": 0.4923, "learning_rate": 8.068073956517397e-05, "epoch": 0.7214695370293409, "percentage": 36.08, "elapsed_time": "23:43:42", "remaining_time": "1 day, 18:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10900, "total_steps": 30076, "loss": 0.4611, "learning_rate": 8.045111432238121e-05, "epoch": 0.7247942814396143, "percentage": 36.24, "elapsed_time": "23:49:28", "remaining_time": "1 day, 17:54:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10950, "total_steps": 30076, "loss": 0.5119, "learning_rate": 8.022046359440623e-05, "epoch": 0.7281190258498877, "percentage": 36.41, "elapsed_time": "23:55:48", "remaining_time": "1 day, 17:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11000, "total_steps": 30076, "loss": 0.5359, "learning_rate": 7.998879514874491e-05, "epoch": 0.7314437702601613, "percentage": 36.57, "elapsed_time": "1 day, 0:02:22", "remaining_time": "1 day, 17:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11050, "total_steps": 30076, "loss": 0.532, "learning_rate": 7.975611678716615e-05, "epoch": 0.7347685146704347, "percentage": 36.74, "elapsed_time": "1 day, 0:08:50", "remaining_time": "1 day, 17:34:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11100, "total_steps": 30076, "loss": 0.4793, "learning_rate": 7.952243634544929e-05, "epoch": 0.7380932590807082, "percentage": 36.91, "elapsed_time": "1 day, 0:15:24", "remaining_time": "1 day, 17:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11150, "total_steps": 30076, "loss": 0.4981, "learning_rate": 7.928776169312016e-05, "epoch": 0.7414180034909816, "percentage": 37.07, "elapsed_time": "1 day, 0:21:50", "remaining_time": "1 day, 17:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11200, "total_steps": 30076, "loss": 0.4578, "learning_rate": 7.905210073318605e-05, "epoch": 0.744742747901255, "percentage": 37.24, "elapsed_time": "1 day, 0:27:41", "remaining_time": "1 day, 17:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11250, "total_steps": 30076, "loss": 0.5101, "learning_rate": 7.881546140186958e-05, "epoch": 0.7480674923115286, "percentage": 37.41, "elapsed_time": "1 day, 0:34:05", "remaining_time": "1 day, 17:06:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11300, "total_steps": 30076, "loss": 0.4905, "learning_rate": 7.857785166834144e-05, "epoch": 0.751392236721802, "percentage": 37.57, "elapsed_time": "1 day, 0:40:20", "remaining_time": "1 day, 16:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11350, "total_steps": 30076, "loss": 0.4868, "learning_rate": 7.833927953445202e-05, "epoch": 0.7547169811320755, "percentage": 37.74, "elapsed_time": "1 day, 0:46:51", "remaining_time": "1 day, 16:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11400, "total_steps": 30076, "loss": 0.5107, "learning_rate": 7.809975303446195e-05, "epoch": 0.7580417255423489, "percentage": 37.9, "elapsed_time": "1 day, 0:53:13", "remaining_time": "1 day, 16:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11450, "total_steps": 30076, "loss": 0.4964, "learning_rate": 7.785928023477142e-05, "epoch": 0.7613664699526224, "percentage": 38.07, "elapsed_time": "1 day, 0:59:35", "remaining_time": "1 day, 16:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11500, "total_steps": 30076, "loss": 0.5179, "learning_rate": 7.761786923364878e-05, "epoch": 0.7646912143628959, "percentage": 38.24, "elapsed_time": "1 day, 1:05:56", "remaining_time": "1 day, 16:32:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11550, "total_steps": 30076, "loss": 0.4624, "learning_rate": 7.737552816095754e-05, "epoch": 0.7680159587731693, "percentage": 38.4, "elapsed_time": "1 day, 1:12:15", "remaining_time": "1 day, 16:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11600, "total_steps": 30076, "loss": 0.4917, "learning_rate": 7.713226517788275e-05, "epoch": 0.7713407031834427, "percentage": 38.57, "elapsed_time": "1 day, 1:18:40", "remaining_time": "1 day, 16:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11650, "total_steps": 30076, "loss": 0.523, "learning_rate": 7.688808847665612e-05, "epoch": 0.7746654475937162, "percentage": 38.74, "elapsed_time": "1 day, 1:24:59", "remaining_time": "1 day, 16:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11700, "total_steps": 30076, "loss": 0.5019, "learning_rate": 7.664300628028017e-05, "epoch": 0.7779901920039897, "percentage": 38.9, "elapsed_time": "1 day, 1:31:14", "remaining_time": "1 day, 16:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11750, "total_steps": 30076, "loss": 0.5049, "learning_rate": 7.639702684225123e-05, "epoch": 0.7813149364142632, "percentage": 39.07, "elapsed_time": "1 day, 1:37:03", "remaining_time": "1 day, 15:57:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11800, "total_steps": 30076, "loss": 0.4823, "learning_rate": 7.615015844628157e-05, "epoch": 0.7846396808245366, "percentage": 39.23, "elapsed_time": "1 day, 1:43:26", "remaining_time": "1 day, 15:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11850, "total_steps": 30076, "loss": 0.4591, "learning_rate": 7.590240940602036e-05, "epoch": 0.78796442523481, "percentage": 39.4, "elapsed_time": "1 day, 1:49:46", "remaining_time": "1 day, 15:43:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11900, "total_steps": 30076, "loss": 0.4851, "learning_rate": 7.565378806477377e-05, "epoch": 0.7912891696450836, "percentage": 39.57, "elapsed_time": "1 day, 1:55:58", "remaining_time": "1 day, 15:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11950, "total_steps": 30076, "loss": 0.4735, "learning_rate": 7.540430279522395e-05, "epoch": 0.794613914055357, "percentage": 39.73, "elapsed_time": "1 day, 2:02:23", "remaining_time": "1 day, 15:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12000, "total_steps": 30076, "loss": 0.4941, "learning_rate": 7.515396199914708e-05, "epoch": 0.7979386584656305, "percentage": 39.9, "elapsed_time": "1 day, 2:08:55", "remaining_time": "1 day, 15:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12050, "total_steps": 30076, "loss": 0.4753, "learning_rate": 7.490277410713044e-05, "epoch": 0.8012634028759039, "percentage": 40.07, "elapsed_time": "1 day, 2:15:15", "remaining_time": "1 day, 15:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12100, "total_steps": 30076, "loss": 0.5152, "learning_rate": 7.46507475782885e-05, "epoch": 0.8045881472861773, "percentage": 40.23, "elapsed_time": "1 day, 2:21:32", "remaining_time": "1 day, 15:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12150, "total_steps": 30076, "loss": 0.523, "learning_rate": 7.439789089997796e-05, "epoch": 0.8079128916964509, "percentage": 40.4, "elapsed_time": "1 day, 2:27:55", "remaining_time": "1 day, 15:02:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12200, "total_steps": 30076, "loss": 0.4939, "learning_rate": 7.414421258751212e-05, "epoch": 0.8112376361067243, "percentage": 40.56, "elapsed_time": "1 day, 2:33:50", "remaining_time": "1 day, 14:55:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12250, "total_steps": 30076, "loss": 0.4787, "learning_rate": 7.38897211838739e-05, "epoch": 0.8145623805169978, "percentage": 40.73, "elapsed_time": "1 day, 2:40:23", "remaining_time": "1 day, 14:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12300, "total_steps": 30076, "loss": 0.4973, "learning_rate": 7.363442525942826e-05, "epoch": 0.8178871249272712, "percentage": 40.9, "elapsed_time": "1 day, 2:46:47", "remaining_time": "1 day, 14:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12350, "total_steps": 30076, "loss": 0.51, "learning_rate": 7.337833341163358e-05, "epoch": 0.8212118693375446, "percentage": 41.06, "elapsed_time": "1 day, 2:53:17", "remaining_time": "1 day, 14:35:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12400, "total_steps": 30076, "loss": 0.5298, "learning_rate": 7.31214542647521e-05, "epoch": 0.8245366137478182, "percentage": 41.23, "elapsed_time": "1 day, 2:59:42", "remaining_time": "1 day, 14:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12450, "total_steps": 30076, "loss": 0.492, "learning_rate": 7.286379646955946e-05, "epoch": 0.8278613581580916, "percentage": 41.4, "elapsed_time": "1 day, 3:06:18", "remaining_time": "1 day, 14:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12500, "total_steps": 30076, "loss": 0.4854, "learning_rate": 7.260536870305347e-05, "epoch": 0.831186102568365, "percentage": 41.56, "elapsed_time": "1 day, 3:12:10", "remaining_time": "1 day, 14:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12550, "total_steps": 30076, "loss": 0.4439, "learning_rate": 7.234617966816174e-05, "epoch": 0.8345108469786385, "percentage": 41.73, "elapsed_time": "1 day, 3:18:17", "remaining_time": "1 day, 14:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12600, "total_steps": 30076, "loss": 0.4949, "learning_rate": 7.208623809344879e-05, "epoch": 0.837835591388912, "percentage": 41.89, "elapsed_time": "1 day, 3:24:39", "remaining_time": "1 day, 14:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12650, "total_steps": 30076, "loss": 0.5091, "learning_rate": 7.182555273282193e-05, "epoch": 0.8411603357991855, "percentage": 42.06, "elapsed_time": "1 day, 3:30:44", "remaining_time": "1 day, 13:53:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12700, "total_steps": 30076, "loss": 0.4732, "learning_rate": 7.156413236523656e-05, "epoch": 0.8444850802094589, "percentage": 42.23, "elapsed_time": "1 day, 3:36:48", "remaining_time": "1 day, 13:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12750, "total_steps": 30076, "loss": 0.4639, "learning_rate": 7.130198579440052e-05, "epoch": 0.8478098246197323, "percentage": 42.39, "elapsed_time": "1 day, 3:42:56", "remaining_time": "1 day, 13:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12800, "total_steps": 30076, "loss": 0.4818, "learning_rate": 7.103912184847757e-05, "epoch": 0.8511345690300058, "percentage": 42.56, "elapsed_time": "1 day, 3:49:12", "remaining_time": "1 day, 13:32:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12850, "total_steps": 30076, "loss": 0.4424, "learning_rate": 7.07755493797901e-05, "epoch": 0.8544593134402793, "percentage": 42.73, "elapsed_time": "1 day, 3:55:10", "remaining_time": "1 day, 13:25:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12900, "total_steps": 30076, "loss": 0.4551, "learning_rate": 7.051127726452102e-05, "epoch": 0.8577840578505528, "percentage": 42.89, "elapsed_time": "1 day, 4:00:56", "remaining_time": "1 day, 13:18:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12950, "total_steps": 30076, "loss": 0.4496, "learning_rate": 7.024631440241491e-05, "epoch": 0.8611088022608262, "percentage": 43.06, "elapsed_time": "1 day, 4:06:55", "remaining_time": "1 day, 13:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13000, "total_steps": 30076, "loss": 0.49, "learning_rate": 6.998066971647817e-05, "epoch": 0.8644335466710996, "percentage": 43.22, "elapsed_time": "1 day, 4:13:02", "remaining_time": "1 day, 13:03:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13050, "total_steps": 30076, "loss": 0.4822, "learning_rate": 6.971435215267866e-05, "epoch": 0.8677582910813731, "percentage": 43.39, "elapsed_time": "1 day, 4:19:22", "remaining_time": "1 day, 12:57:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13100, "total_steps": 30076, "loss": 0.4665, "learning_rate": 6.944737067964429e-05, "epoch": 0.8710830354916466, "percentage": 43.56, "elapsed_time": "1 day, 4:25:41", "remaining_time": "1 day, 12:50:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13150, "total_steps": 30076, "loss": 0.4762, "learning_rate": 6.917973428836118e-05, "epoch": 0.8744077799019201, "percentage": 43.72, "elapsed_time": "1 day, 4:31:43", "remaining_time": "1 day, 12:43:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13200, "total_steps": 30076, "loss": 0.4301, "learning_rate": 6.891145199187065e-05, "epoch": 0.8777325243121935, "percentage": 43.89, "elapsed_time": "1 day, 4:38:05", "remaining_time": "1 day, 12:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13250, "total_steps": 30076, "loss": 0.5202, "learning_rate": 6.864253282496595e-05, "epoch": 0.8810572687224669, "percentage": 44.06, "elapsed_time": "1 day, 4:44:50", "remaining_time": "1 day, 12:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13300, "total_steps": 30076, "loss": 0.4664, "learning_rate": 6.837298584388771e-05, "epoch": 0.8843820131327405, "percentage": 44.22, "elapsed_time": "1 day, 4:50:57", "remaining_time": "1 day, 12:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13350, "total_steps": 30076, "loss": 0.4748, "learning_rate": 6.810282012601923e-05, "epoch": 0.8877067575430139, "percentage": 44.39, "elapsed_time": "1 day, 4:57:18", "remaining_time": "1 day, 12:16:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13400, "total_steps": 30076, "loss": 0.4798, "learning_rate": 6.783204476958058e-05, "epoch": 0.8910315019532873, "percentage": 44.55, "elapsed_time": "1 day, 5:03:22", "remaining_time": "1 day, 12:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13450, "total_steps": 30076, "loss": 0.5189, "learning_rate": 6.75606688933223e-05, "epoch": 0.8943562463635608, "percentage": 44.72, "elapsed_time": "1 day, 5:09:50", "remaining_time": "1 day, 12:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13500, "total_steps": 30076, "loss": 0.4913, "learning_rate": 6.728870163621836e-05, "epoch": 0.8976809907738342, "percentage": 44.89, "elapsed_time": "1 day, 5:15:55", "remaining_time": "1 day, 11:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13550, "total_steps": 30076, "loss": 0.453, "learning_rate": 6.701615215715829e-05, "epoch": 0.9010057351841078, "percentage": 45.05, "elapsed_time": "1 day, 5:22:21", "remaining_time": "1 day, 11:49:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13600, "total_steps": 30076, "loss": 0.459, "learning_rate": 6.674302963463876e-05, "epoch": 0.9043304795943812, "percentage": 45.22, "elapsed_time": "1 day, 5:28:35", "remaining_time": "1 day, 11:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13650, "total_steps": 30076, "loss": 0.5119, "learning_rate": 6.646934326645452e-05, "epoch": 0.9076552240046546, "percentage": 45.39, "elapsed_time": "1 day, 5:34:22", "remaining_time": "1 day, 11:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13700, "total_steps": 30076, "loss": 0.4414, "learning_rate": 6.61951022693887e-05, "epoch": 0.9109799684149281, "percentage": 45.55, "elapsed_time": "1 day, 5:40:13", "remaining_time": "1 day, 11:27:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13750, "total_steps": 30076, "loss": 0.5148, "learning_rate": 6.592031587890224e-05, "epoch": 0.9143047128252015, "percentage": 45.72, "elapsed_time": "1 day, 5:46:18", "remaining_time": "1 day, 11:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13800, "total_steps": 30076, "loss": 0.4998, "learning_rate": 6.564499334882312e-05, "epoch": 0.9176294572354751, "percentage": 45.88, "elapsed_time": "1 day, 5:52:40", "remaining_time": "1 day, 11:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13850, "total_steps": 30076, "loss": 0.5493, "learning_rate": 6.536914395103446e-05, "epoch": 0.9209542016457485, "percentage": 46.05, "elapsed_time": "1 day, 5:58:47", "remaining_time": "1 day, 11:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13900, "total_steps": 30076, "loss": 0.4527, "learning_rate": 6.509277697516255e-05, "epoch": 0.9242789460560219, "percentage": 46.22, "elapsed_time": "1 day, 6:04:46", "remaining_time": "1 day, 11:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13950, "total_steps": 30076, "loss": 0.4917, "learning_rate": 6.481590172826371e-05, "epoch": 0.9276036904662954, "percentage": 46.38, "elapsed_time": "1 day, 6:11:04", "remaining_time": "1 day, 10:53:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14000, "total_steps": 30076, "loss": 0.5103, "learning_rate": 6.453852753451119e-05, "epoch": 0.9309284348765688, "percentage": 46.55, "elapsed_time": "1 day, 6:17:28", "remaining_time": "1 day, 10:46:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14050, "total_steps": 30076, "loss": 0.4945, "learning_rate": 6.426066373488084e-05, "epoch": 0.9342531792868424, "percentage": 46.71, "elapsed_time": "1 day, 6:24:09", "remaining_time": "1 day, 10:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14100, "total_steps": 30076, "loss": 0.5453, "learning_rate": 6.39823196868368e-05, "epoch": 0.9375779236971158, "percentage": 46.88, "elapsed_time": "1 day, 6:30:17", "remaining_time": "1 day, 10:33:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14150, "total_steps": 30076, "loss": 0.4735, "learning_rate": 6.370350476401624e-05, "epoch": 0.9409026681073892, "percentage": 47.05, "elapsed_time": "1 day, 6:36:47", "remaining_time": "1 day, 10:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14200, "total_steps": 30076, "loss": 0.5343, "learning_rate": 6.342422835591368e-05, "epoch": 0.9442274125176627, "percentage": 47.21, "elapsed_time": "1 day, 6:43:10", "remaining_time": "1 day, 10:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14250, "total_steps": 30076, "loss": 0.5078, "learning_rate": 6.314449986756489e-05, "epoch": 0.9475521569279362, "percentage": 47.38, "elapsed_time": "1 day, 6:49:34", "remaining_time": "1 day, 10:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14300, "total_steps": 30076, "loss": 0.4985, "learning_rate": 6.286432871923e-05, "epoch": 0.9508769013382097, "percentage": 47.55, "elapsed_time": "1 day, 6:56:13", "remaining_time": "1 day, 10:07:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14350, "total_steps": 30076, "loss": 0.4495, "learning_rate": 6.258372434607645e-05, "epoch": 0.9542016457484831, "percentage": 47.71, "elapsed_time": "1 day, 7:02:24", "remaining_time": "1 day, 10:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14400, "total_steps": 30076, "loss": 0.4606, "learning_rate": 6.230269619786111e-05, "epoch": 0.9575263901587565, "percentage": 47.88, "elapsed_time": "1 day, 7:08:29", "remaining_time": "1 day, 9:54:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14450, "total_steps": 30076, "loss": 0.4699, "learning_rate": 6.202125373861207e-05, "epoch": 0.96085113456903, "percentage": 48.04, "elapsed_time": "1 day, 7:14:57", "remaining_time": "1 day, 9:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14500, "total_steps": 30076, "loss": 0.4802, "learning_rate": 6.173940644630996e-05, "epoch": 0.9641758789793035, "percentage": 48.21, "elapsed_time": "1 day, 7:21:02", "remaining_time": "1 day, 9:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14550, "total_steps": 30076, "loss": 0.4557, "learning_rate": 6.145716381256873e-05, "epoch": 0.9675006233895769, "percentage": 48.38, "elapsed_time": "1 day, 7:27:19", "remaining_time": "1 day, 9:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14600, "total_steps": 30076, "loss": 0.4472, "learning_rate": 6.117453534231606e-05, "epoch": 0.9708253677998504, "percentage": 48.54, "elapsed_time": "1 day, 7:33:44", "remaining_time": "1 day, 9:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14650, "total_steps": 30076, "loss": 0.4498, "learning_rate": 6.0891530553473195e-05, "epoch": 0.9741501122101238, "percentage": 48.71, "elapsed_time": "1 day, 7:40:05", "remaining_time": "1 day, 9:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14700, "total_steps": 30076, "loss": 0.4741, "learning_rate": 6.060815897663447e-05, "epoch": 0.9774748566203973, "percentage": 48.88, "elapsed_time": "1 day, 7:46:28", "remaining_time": "1 day, 9:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14750, "total_steps": 30076, "loss": 0.4821, "learning_rate": 6.0324430154746316e-05, "epoch": 0.9807996010306708, "percentage": 49.04, "elapsed_time": "1 day, 7:52:52", "remaining_time": "1 day, 9:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14800, "total_steps": 30076, "loss": 0.4687, "learning_rate": 6.004035364278593e-05, "epoch": 0.9841243454409442, "percentage": 49.21, "elapsed_time": "1 day, 7:59:09", "remaining_time": "1 day, 9:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14850, "total_steps": 30076, "loss": 0.427, "learning_rate": 5.9755939007439445e-05, "epoch": 0.9874490898512177, "percentage": 49.37, "elapsed_time": "1 day, 8:05:18", "remaining_time": "1 day, 8:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14900, "total_steps": 30076, "loss": 0.4594, "learning_rate": 5.9471195826779834e-05, "epoch": 0.9907738342614911, "percentage": 49.54, "elapsed_time": "1 day, 8:11:28", "remaining_time": "1 day, 8:47:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14950, "total_steps": 30076, "loss": 0.482, "learning_rate": 5.918613368994423e-05, "epoch": 0.9940985786717647, "percentage": 49.71, "elapsed_time": "1 day, 8:17:43", "remaining_time": "1 day, 8:40:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15000, "total_steps": 30076, "loss": 0.4322, "learning_rate": 5.8900762196811175e-05, "epoch": 0.9974233230820381, "percentage": 49.87, "elapsed_time": "1 day, 8:23:44", "remaining_time": "1 day, 8:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15050, "total_steps": 30076, "loss": 0.4441, "learning_rate": 5.861509095767714e-05, "epoch": 1.0007480674923115, "percentage": 50.04, "elapsed_time": "1 day, 8:30:13", "remaining_time": "1 day, 8:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15100, "total_steps": 30076, "loss": 0.4052, "learning_rate": 5.832912959293304e-05, "epoch": 1.004072811902585, "percentage": 50.21, "elapsed_time": "1 day, 8:36:20", "remaining_time": "1 day, 8:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15150, "total_steps": 30076, "loss": 0.4061, "learning_rate": 5.804288773274011e-05, "epoch": 1.0073975563128585, "percentage": 50.37, "elapsed_time": "1 day, 8:42:27", "remaining_time": "1 day, 8:13:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15200, "total_steps": 30076, "loss": 0.3922, "learning_rate": 5.775637501670579e-05, "epoch": 1.0107223007231319, "percentage": 50.54, "elapsed_time": "1 day, 8:48:43", "remaining_time": "1 day, 8:06:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15250, "total_steps": 30076, "loss": 0.444, "learning_rate": 5.7469601093558854e-05, "epoch": 1.0140470451334054, "percentage": 50.7, "elapsed_time": "1 day, 8:54:48", "remaining_time": "1 day, 7:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15300, "total_steps": 30076, "loss": 0.4149, "learning_rate": 5.718257562082471e-05, "epoch": 1.017371789543679, "percentage": 50.87, "elapsed_time": "1 day, 9:01:07", "remaining_time": "1 day, 7:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15350, "total_steps": 30076, "loss": 0.3901, "learning_rate": 5.689530826449997e-05, "epoch": 1.0206965339539522, "percentage": 51.04, "elapsed_time": "1 day, 9:07:11", "remaining_time": "1 day, 7:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15400, "total_steps": 30076, "loss": 0.4268, "learning_rate": 5.660780869872711e-05, "epoch": 1.0240212783642257, "percentage": 51.2, "elapsed_time": "1 day, 9:13:33", "remaining_time": "1 day, 7:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15450, "total_steps": 30076, "loss": 0.4328, "learning_rate": 5.632008660546853e-05, "epoch": 1.0273460227744993, "percentage": 51.37, "elapsed_time": "1 day, 9:19:48", "remaining_time": "1 day, 7:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15500, "total_steps": 30076, "loss": 0.3798, "learning_rate": 5.6032151674180575e-05, "epoch": 1.0306707671847726, "percentage": 51.54, "elapsed_time": "1 day, 9:25:47", "remaining_time": "1 day, 7:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15550, "total_steps": 30076, "loss": 0.4215, "learning_rate": 5.574401360148727e-05, "epoch": 1.033995511595046, "percentage": 51.7, "elapsed_time": "1 day, 9:31:42", "remaining_time": "1 day, 7:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15600, "total_steps": 30076, "loss": 0.4242, "learning_rate": 5.5455682090853624e-05, "epoch": 1.0373202560053196, "percentage": 51.87, "elapsed_time": "1 day, 9:37:42", "remaining_time": "1 day, 7:12:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15650, "total_steps": 30076, "loss": 0.4163, "learning_rate": 5.5167166852259055e-05, "epoch": 1.0406450004155932, "percentage": 52.03, "elapsed_time": "1 day, 9:44:07", "remaining_time": "1 day, 7:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15700, "total_steps": 30076, "loss": 0.3637, "learning_rate": 5.4878477601870194e-05, "epoch": 1.0439697448258665, "percentage": 52.2, "elapsed_time": "1 day, 9:50:17", "remaining_time": "1 day, 6:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15750, "total_steps": 30076, "loss": 0.4117, "learning_rate": 5.458962406171384e-05, "epoch": 1.04729448923614, "percentage": 52.37, "elapsed_time": "1 day, 9:56:22", "remaining_time": "1 day, 6:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15800, "total_steps": 30076, "loss": 0.4177, "learning_rate": 5.430061595934941e-05, "epoch": 1.0506192336464135, "percentage": 52.53, "elapsed_time": "1 day, 10:02:11", "remaining_time": "1 day, 6:45:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15850, "total_steps": 30076, "loss": 0.4446, "learning_rate": 5.401146302754153e-05, "epoch": 1.0539439780566868, "percentage": 52.7, "elapsed_time": "1 day, 10:08:36", "remaining_time": "1 day, 6:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15900, "total_steps": 30076, "loss": 0.4097, "learning_rate": 5.372217500393205e-05, "epoch": 1.0572687224669604, "percentage": 52.87, "elapsed_time": "1 day, 10:14:40", "remaining_time": "1 day, 6:31:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15950, "total_steps": 30076, "loss": 0.378, "learning_rate": 5.3432761630712335e-05, "epoch": 1.0605934668772339, "percentage": 53.03, "elapsed_time": "1 day, 10:21:03", "remaining_time": "1 day, 6:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16000, "total_steps": 30076, "loss": 0.373, "learning_rate": 5.314323265429501e-05, "epoch": 1.0639182112875072, "percentage": 53.2, "elapsed_time": "1 day, 10:27:04", "remaining_time": "1 day, 6:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16050, "total_steps": 30076, "loss": 0.4159, "learning_rate": 5.285359782498582e-05, "epoch": 1.0672429556977807, "percentage": 53.36, "elapsed_time": "1 day, 10:33:14", "remaining_time": "1 day, 6:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16100, "total_steps": 30076, "loss": 0.4017, "learning_rate": 5.2563866896655275e-05, "epoch": 1.0705677001080542, "percentage": 53.53, "elapsed_time": "1 day, 10:39:17", "remaining_time": "1 day, 6:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16150, "total_steps": 30076, "loss": 0.4627, "learning_rate": 5.227404962641016e-05, "epoch": 1.0738924445183278, "percentage": 53.7, "elapsed_time": "1 day, 10:45:37", "remaining_time": "1 day, 5:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16200, "total_steps": 30076, "loss": 0.4073, "learning_rate": 5.198415577426493e-05, "epoch": 1.077217188928601, "percentage": 53.86, "elapsed_time": "1 day, 10:52:04", "remaining_time": "1 day, 5:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16250, "total_steps": 30076, "loss": 0.4024, "learning_rate": 5.1694195102813046e-05, "epoch": 1.0805419333388746, "percentage": 54.03, "elapsed_time": "1 day, 10:58:39", "remaining_time": "1 day, 5:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16300, "total_steps": 30076, "loss": 0.4322, "learning_rate": 5.140417737689822e-05, "epoch": 1.0838666777491481, "percentage": 54.2, "elapsed_time": "1 day, 11:04:54", "remaining_time": "1 day, 5:38:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16350, "total_steps": 30076, "loss": 0.3967, "learning_rate": 5.111411236328555e-05, "epoch": 1.0871914221594214, "percentage": 54.36, "elapsed_time": "1 day, 11:11:04", "remaining_time": "1 day, 5:32:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16400, "total_steps": 30076, "loss": 0.4123, "learning_rate": 5.0824009830332606e-05, "epoch": 1.090516166569695, "percentage": 54.53, "elapsed_time": "1 day, 11:17:25", "remaining_time": "1 day, 5:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16450, "total_steps": 30076, "loss": 0.398, "learning_rate": 5.053387954766049e-05, "epoch": 1.0938409109799685, "percentage": 54.69, "elapsed_time": "1 day, 11:24:07", "remaining_time": "1 day, 5:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16500, "total_steps": 30076, "loss": 0.4162, "learning_rate": 5.02437312858248e-05, "epoch": 1.0971656553902418, "percentage": 54.86, "elapsed_time": "1 day, 11:30:27", "remaining_time": "1 day, 5:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16550, "total_steps": 30076, "loss": 0.3965, "learning_rate": 4.995357481598663e-05, "epoch": 1.1004903998005153, "percentage": 55.03, "elapsed_time": "1 day, 11:36:28", "remaining_time": "1 day, 5:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16600, "total_steps": 30076, "loss": 0.4073, "learning_rate": 4.966341990958347e-05, "epoch": 1.1038151442107889, "percentage": 55.19, "elapsed_time": "1 day, 11:42:33", "remaining_time": "1 day, 4:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16650, "total_steps": 30076, "loss": 0.4228, "learning_rate": 4.937327633800018e-05, "epoch": 1.1071398886210622, "percentage": 55.36, "elapsed_time": "1 day, 11:48:42", "remaining_time": "1 day, 4:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16700, "total_steps": 30076, "loss": 0.3919, "learning_rate": 4.908315387223985e-05, "epoch": 1.1104646330313357, "percentage": 55.53, "elapsed_time": "1 day, 11:54:47", "remaining_time": "1 day, 4:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16750, "total_steps": 30076, "loss": 0.3981, "learning_rate": 4.87930622825949e-05, "epoch": 1.1137893774416092, "percentage": 55.69, "elapsed_time": "1 day, 12:00:58", "remaining_time": "1 day, 4:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16800, "total_steps": 30076, "loss": 0.4203, "learning_rate": 4.850301133831786e-05, "epoch": 1.1171141218518827, "percentage": 55.86, "elapsed_time": "1 day, 12:07:41", "remaining_time": "1 day, 4:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16850, "total_steps": 30076, "loss": 0.4215, "learning_rate": 4.821301080729249e-05, "epoch": 1.120438866262156, "percentage": 56.02, "elapsed_time": "1 day, 12:14:02", "remaining_time": "1 day, 4:26:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16900, "total_steps": 30076, "loss": 0.4055, "learning_rate": 4.792307045570486e-05, "epoch": 1.1237636106724296, "percentage": 56.19, "elapsed_time": "1 day, 12:20:30", "remaining_time": "1 day, 4:20:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16950, "total_steps": 30076, "loss": 0.3586, "learning_rate": 4.7633200047714345e-05, "epoch": 1.127088355082703, "percentage": 56.36, "elapsed_time": "1 day, 12:26:48", "remaining_time": "1 day, 4:13:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17000, "total_steps": 30076, "loss": 0.4116, "learning_rate": 4.734340934512492e-05, "epoch": 1.1304130994929764, "percentage": 56.52, "elapsed_time": "1 day, 12:33:04", "remaining_time": "1 day, 4:06:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17050, "total_steps": 30076, "loss": 0.4024, "learning_rate": 4.70537081070563e-05, "epoch": 1.13373784390325, "percentage": 56.69, "elapsed_time": "1 day, 12:39:16", "remaining_time": "1 day, 4:00:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17100, "total_steps": 30076, "loss": 0.4162, "learning_rate": 4.6764106089615454e-05, "epoch": 1.1370625883135235, "percentage": 56.86, "elapsed_time": "1 day, 12:45:27", "remaining_time": "1 day, 3:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17150, "total_steps": 30076, "loss": 0.3925, "learning_rate": 4.647461304556787e-05, "epoch": 1.1403873327237968, "percentage": 57.02, "elapsed_time": "1 day, 12:51:30", "remaining_time": "1 day, 3:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17200, "total_steps": 30076, "loss": 0.4147, "learning_rate": 4.618523872400921e-05, "epoch": 1.1437120771340703, "percentage": 57.19, "elapsed_time": "1 day, 12:57:50", "remaining_time": "1 day, 3:40:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17250, "total_steps": 30076, "loss": 0.4036, "learning_rate": 4.589599287003703e-05, "epoch": 1.1470368215443438, "percentage": 57.35, "elapsed_time": "1 day, 13:03:56", "remaining_time": "1 day, 3:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17300, "total_steps": 30076, "loss": 0.4285, "learning_rate": 4.56068852244225e-05, "epoch": 1.1503615659546171, "percentage": 57.52, "elapsed_time": "1 day, 13:10:26", "remaining_time": "1 day, 3:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17350, "total_steps": 30076, "loss": 0.3751, "learning_rate": 4.5317925523282464e-05, "epoch": 1.1536863103648907, "percentage": 57.69, "elapsed_time": "1 day, 13:16:25", "remaining_time": "1 day, 3:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17400, "total_steps": 30076, "loss": 0.408, "learning_rate": 4.5029123497751514e-05, "epoch": 1.1570110547751642, "percentage": 57.85, "elapsed_time": "1 day, 13:23:09", "remaining_time": "1 day, 3:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17450, "total_steps": 30076, "loss": 0.4105, "learning_rate": 4.474048887365426e-05, "epoch": 1.1603357991854377, "percentage": 58.02, "elapsed_time": "1 day, 13:29:24", "remaining_time": "1 day, 3:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17500, "total_steps": 30076, "loss": 0.3618, "learning_rate": 4.445203137117788e-05, "epoch": 1.163660543595711, "percentage": 58.19, "elapsed_time": "1 day, 13:35:57", "remaining_time": "1 day, 3:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17550, "total_steps": 30076, "loss": 0.4433, "learning_rate": 4.4163760704544675e-05, "epoch": 1.1669852880059846, "percentage": 58.35, "elapsed_time": "1 day, 13:42:23", "remaining_time": "1 day, 2:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17600, "total_steps": 30076, "loss": 0.4128, "learning_rate": 4.3875686581685e-05, "epoch": 1.170310032416258, "percentage": 58.52, "elapsed_time": "1 day, 13:48:32", "remaining_time": "1 day, 2:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17650, "total_steps": 30076, "loss": 0.4035, "learning_rate": 4.358781870391033e-05, "epoch": 1.1736347768265314, "percentage": 58.68, "elapsed_time": "1 day, 13:55:07", "remaining_time": "1 day, 2:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17700, "total_steps": 30076, "loss": 0.3809, "learning_rate": 4.330016676558651e-05, "epoch": 1.176959521236805, "percentage": 58.85, "elapsed_time": "1 day, 14:01:04", "remaining_time": "1 day, 2:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17750, "total_steps": 30076, "loss": 0.3875, "learning_rate": 4.3012740453807346e-05, "epoch": 1.1802842656470784, "percentage": 59.02, "elapsed_time": "1 day, 14:07:23", "remaining_time": "1 day, 2:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17800, "total_steps": 30076, "loss": 0.4059, "learning_rate": 4.272554944806831e-05, "epoch": 1.1836090100573518, "percentage": 59.18, "elapsed_time": "1 day, 14:13:58", "remaining_time": "1 day, 2:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17850, "total_steps": 30076, "loss": 0.385, "learning_rate": 4.243860341994062e-05, "epoch": 1.1869337544676253, "percentage": 59.35, "elapsed_time": "1 day, 14:19:54", "remaining_time": "1 day, 2:15:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17900, "total_steps": 30076, "loss": 0.433, "learning_rate": 4.2151912032745547e-05, "epoch": 1.1902584988778988, "percentage": 59.52, "elapsed_time": "1 day, 14:26:17", "remaining_time": "1 day, 2:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17950, "total_steps": 30076, "loss": 0.3464, "learning_rate": 4.18654849412289e-05, "epoch": 1.1935832432881721, "percentage": 59.68, "elapsed_time": "1 day, 14:32:18", "remaining_time": "1 day, 2:02:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18000, "total_steps": 30076, "loss": 0.406, "learning_rate": 4.157933179123599e-05, "epoch": 1.1969079876984456, "percentage": 59.85, "elapsed_time": "1 day, 14:38:24", "remaining_time": "1 day, 1:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18050, "total_steps": 30076, "loss": 0.4521, "learning_rate": 4.129346221938676e-05, "epoch": 1.2002327321087192, "percentage": 60.01, "elapsed_time": "1 day, 14:44:18", "remaining_time": "1 day, 1:48:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18100, "total_steps": 30076, "loss": 0.3983, "learning_rate": 4.100788585275125e-05, "epoch": 1.2035574765189927, "percentage": 60.18, "elapsed_time": "1 day, 14:50:42", "remaining_time": "1 day, 1:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18150, "total_steps": 30076, "loss": 0.4084, "learning_rate": 4.0722612308525335e-05, "epoch": 1.206882220929266, "percentage": 60.35, "elapsed_time": "1 day, 14:56:50", "remaining_time": "1 day, 1:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18200, "total_steps": 30076, "loss": 0.3673, "learning_rate": 4.043765119370699e-05, "epoch": 1.2102069653395395, "percentage": 60.51, "elapsed_time": "1 day, 15:02:49", "remaining_time": "1 day, 1:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18250, "total_steps": 30076, "loss": 0.3686, "learning_rate": 4.0153012104772635e-05, "epoch": 1.213531709749813, "percentage": 60.68, "elapsed_time": "1 day, 15:08:41", "remaining_time": "1 day, 1:21:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18300, "total_steps": 30076, "loss": 0.4034, "learning_rate": 3.9868704627354e-05, "epoch": 1.2168564541600864, "percentage": 60.85, "elapsed_time": "1 day, 15:15:06", "remaining_time": "1 day, 1:15:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18350, "total_steps": 30076, "loss": 0.3896, "learning_rate": 3.9584738335915314e-05, "epoch": 1.22018119857036, "percentage": 61.01, "elapsed_time": "1 day, 15:21:11", "remaining_time": "1 day, 1:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18400, "total_steps": 30076, "loss": 0.3943, "learning_rate": 3.930112279343094e-05, "epoch": 1.2235059429806334, "percentage": 61.18, "elapsed_time": "1 day, 15:27:12", "remaining_time": "1 day, 1:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18450, "total_steps": 30076, "loss": 0.3821, "learning_rate": 3.9017867551063184e-05, "epoch": 1.226830687390907, "percentage": 61.34, "elapsed_time": "1 day, 15:33:17", "remaining_time": "1 day, 0:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18500, "total_steps": 30076, "loss": 0.3888, "learning_rate": 3.8734982147840756e-05, "epoch": 1.2301554318011803, "percentage": 61.51, "elapsed_time": "1 day, 15:39:40", "remaining_time": "1 day, 0:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18550, "total_steps": 30076, "loss": 0.4109, "learning_rate": 3.845247611033749e-05, "epoch": 1.2334801762114538, "percentage": 61.68, "elapsed_time": "1 day, 15:45:26", "remaining_time": "1 day, 0:42:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18600, "total_steps": 30076, "loss": 0.3897, "learning_rate": 3.817035895235159e-05, "epoch": 1.236804920621727, "percentage": 61.84, "elapsed_time": "1 day, 15:51:47", "remaining_time": "1 day, 0:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18650, "total_steps": 30076, "loss": 0.3637, "learning_rate": 3.7888640174585096e-05, "epoch": 1.2401296650320006, "percentage": 62.01, "elapsed_time": "1 day, 15:58:03", "remaining_time": "1 day, 0:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18700, "total_steps": 30076, "loss": 0.3688, "learning_rate": 3.760732926432407e-05, "epoch": 1.2434544094422741, "percentage": 62.18, "elapsed_time": "1 day, 16:04:22", "remaining_time": "1 day, 0:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18750, "total_steps": 30076, "loss": 0.412, "learning_rate": 3.732643569511901e-05, "epoch": 1.2467791538525477, "percentage": 62.34, "elapsed_time": "1 day, 16:10:38", "remaining_time": "1 day, 0:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18800, "total_steps": 30076, "loss": 0.4127, "learning_rate": 3.704596892646593e-05, "epoch": 1.250103898262821, "percentage": 62.51, "elapsed_time": "1 day, 16:16:56", "remaining_time": "1 day, 0:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18850, "total_steps": 30076, "loss": 0.3849, "learning_rate": 3.676593840348765e-05, "epoch": 1.2534286426730945, "percentage": 62.67, "elapsed_time": "1 day, 16:23:06", "remaining_time": "1 day, 0:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18900, "total_steps": 30076, "loss": 0.412, "learning_rate": 3.648635355661577e-05, "epoch": 1.256753387083368, "percentage": 62.84, "elapsed_time": "1 day, 16:29:27", "remaining_time": "23:56:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18950, "total_steps": 30076, "loss": 0.4414, "learning_rate": 3.6207223801273196e-05, "epoch": 1.2600781314936413, "percentage": 63.01, "elapsed_time": "1 day, 16:36:03", "remaining_time": "23:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19000, "total_steps": 30076, "loss": 0.3557, "learning_rate": 3.5928558537556895e-05, "epoch": 1.2634028759039149, "percentage": 63.17, "elapsed_time": "1 day, 16:42:18", "remaining_time": "23:43:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19050, "total_steps": 30076, "loss": 0.3692, "learning_rate": 3.565036714992142e-05, "epoch": 1.2667276203141884, "percentage": 63.34, "elapsed_time": "1 day, 16:48:45", "remaining_time": "23:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19100, "total_steps": 30076, "loss": 0.3895, "learning_rate": 3.537265900686286e-05, "epoch": 1.270052364724462, "percentage": 63.51, "elapsed_time": "1 day, 16:54:57", "remaining_time": "23:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19150, "total_steps": 30076, "loss": 0.3645, "learning_rate": 3.5095443460603405e-05, "epoch": 1.2733771091347352, "percentage": 63.67, "elapsed_time": "1 day, 17:01:13", "remaining_time": "23:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19200, "total_steps": 30076, "loss": 0.3473, "learning_rate": 3.4818729846776254e-05, "epoch": 1.2767018535450088, "percentage": 63.84, "elapsed_time": "1 day, 17:07:58", "remaining_time": "23:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19250, "total_steps": 30076, "loss": 0.3837, "learning_rate": 3.4542527484111365e-05, "epoch": 1.280026597955282, "percentage": 64.0, "elapsed_time": "1 day, 17:14:21", "remaining_time": "23:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19300, "total_steps": 30076, "loss": 0.3911, "learning_rate": 3.426684567412153e-05, "epoch": 1.2833513423655556, "percentage": 64.17, "elapsed_time": "1 day, 17:21:04", "remaining_time": "23:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19350, "total_steps": 30076, "loss": 0.4085, "learning_rate": 3.3991693700789235e-05, "epoch": 1.2866760867758291, "percentage": 64.34, "elapsed_time": "1 day, 17:27:25", "remaining_time": "22:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19400, "total_steps": 30076, "loss": 0.37, "learning_rate": 3.371708083025392e-05, "epoch": 1.2900008311861026, "percentage": 64.5, "elapsed_time": "1 day, 17:33:37", "remaining_time": "22:52:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19450, "total_steps": 30076, "loss": 0.359, "learning_rate": 3.344301631049993e-05, "epoch": 1.293325575596376, "percentage": 64.67, "elapsed_time": "1 day, 17:39:49", "remaining_time": "22:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19500, "total_steps": 30076, "loss": 0.3657, "learning_rate": 3.316950937104518e-05, "epoch": 1.2966503200066495, "percentage": 64.84, "elapsed_time": "1 day, 17:46:21", "remaining_time": "22:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19550, "total_steps": 30076, "loss": 0.3981, "learning_rate": 3.2896569222630224e-05, "epoch": 1.299975064416923, "percentage": 65.0, "elapsed_time": "1 day, 17:52:25", "remaining_time": "22:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19600, "total_steps": 30076, "loss": 0.3821, "learning_rate": 3.26242050569081e-05, "epoch": 1.3032998088271963, "percentage": 65.17, "elapsed_time": "1 day, 17:58:47", "remaining_time": "22:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19650, "total_steps": 30076, "loss": 0.3534, "learning_rate": 3.235242604613478e-05, "epoch": 1.3066245532374698, "percentage": 65.33, "elapsed_time": "1 day, 18:04:45", "remaining_time": "22:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19700, "total_steps": 30076, "loss": 0.3691, "learning_rate": 3.208124134286038e-05, "epoch": 1.3099492976477434, "percentage": 65.5, "elapsed_time": "1 day, 18:10:42", "remaining_time": "22:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19750, "total_steps": 30076, "loss": 0.3995, "learning_rate": 3.181066007962079e-05, "epoch": 1.313274042058017, "percentage": 65.67, "elapsed_time": "1 day, 18:17:08", "remaining_time": "22:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19800, "total_steps": 30076, "loss": 0.422, "learning_rate": 3.1540691368630185e-05, "epoch": 1.3165987864682902, "percentage": 65.83, "elapsed_time": "1 day, 18:22:51", "remaining_time": "21:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19850, "total_steps": 30076, "loss": 0.4023, "learning_rate": 3.127134430147417e-05, "epoch": 1.3199235308785637, "percentage": 66.0, "elapsed_time": "1 day, 18:29:15", "remaining_time": "21:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19900, "total_steps": 30076, "loss": 0.4225, "learning_rate": 3.100262794880363e-05, "epoch": 1.323248275288837, "percentage": 66.17, "elapsed_time": "1 day, 18:35:17", "remaining_time": "21:46:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19950, "total_steps": 30076, "loss": 0.4148, "learning_rate": 3.073455136002919e-05, "epoch": 1.3265730196991106, "percentage": 66.33, "elapsed_time": "1 day, 18:41:19", "remaining_time": "21:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20000, "total_steps": 30076, "loss": 0.4008, "learning_rate": 3.0467123563016513e-05, "epoch": 1.329897764109384, "percentage": 66.5, "elapsed_time": "1 day, 18:47:07", "remaining_time": "21:33:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20000, "total_steps": 30076, "eval_loss": 0.36843690276145935, "epoch": 1.329897764109384, "percentage": 66.5, "elapsed_time": "1 day, 19:59:56", "remaining_time": "22:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20050, "total_steps": 30076, "loss": 0.3904, "learning_rate": 3.0200353563782248e-05, "epoch": 1.3332225085196576, "percentage": 66.66, "elapsed_time": "1 day, 20:05:49", "remaining_time": "22:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20100, "total_steps": 30076, "loss": 0.3746, "learning_rate": 2.9934250346190818e-05, "epoch": 1.336547252929931, "percentage": 66.83, "elapsed_time": "1 day, 20:11:57", "remaining_time": "21:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20150, "total_steps": 30076, "loss": 0.3831, "learning_rate": 2.9668822871651736e-05, "epoch": 1.3398719973402045, "percentage": 67.0, "elapsed_time": "1 day, 20:18:13", "remaining_time": "21:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20200, "total_steps": 30076, "loss": 0.376, "learning_rate": 2.9404080078817924e-05, "epoch": 1.343196741750478, "percentage": 67.16, "elapsed_time": "1 day, 20:24:48", "remaining_time": "21:42:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20250, "total_steps": 30076, "loss": 0.3932, "learning_rate": 2.9140030883284684e-05, "epoch": 1.3465214861607513, "percentage": 67.33, "elapsed_time": "1 day, 20:31:23", "remaining_time": "21:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20300, "total_steps": 30076, "loss": 0.4033, "learning_rate": 2.8876684177289404e-05, "epoch": 1.3498462305710248, "percentage": 67.5, "elapsed_time": "1 day, 20:37:49", "remaining_time": "21:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20350, "total_steps": 30076, "loss": 0.3659, "learning_rate": 2.861404882941212e-05, "epoch": 1.3531709749812983, "percentage": 67.66, "elapsed_time": "1 day, 20:43:45", "remaining_time": "21:22:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20400, "total_steps": 30076, "loss": 0.3681, "learning_rate": 2.8352133684276853e-05, "epoch": 1.3564957193915719, "percentage": 67.83, "elapsed_time": "1 day, 20:49:37", "remaining_time": "21:15:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20450, "total_steps": 30076, "loss": 0.4492, "learning_rate": 2.8090947562253807e-05, "epoch": 1.3598204638018452, "percentage": 67.99, "elapsed_time": "1 day, 20:55:44", "remaining_time": "21:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20500, "total_steps": 30076, "loss": 0.387, "learning_rate": 2.7830499259162213e-05, "epoch": 1.3631452082121187, "percentage": 68.16, "elapsed_time": "1 day, 21:02:01", "remaining_time": "21:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20550, "total_steps": 30076, "loss": 0.4326, "learning_rate": 2.7570797545974235e-05, "epoch": 1.3664699526223922, "percentage": 68.33, "elapsed_time": "1 day, 21:08:30", "remaining_time": "20:55:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20600, "total_steps": 30076, "loss": 0.4243, "learning_rate": 2.7311851168519496e-05, "epoch": 1.3697946970326655, "percentage": 68.49, "elapsed_time": "1 day, 21:14:39", "remaining_time": "20:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20650, "total_steps": 30076, "loss": 0.3845, "learning_rate": 2.7053668847190672e-05, "epoch": 1.373119441442939, "percentage": 68.66, "elapsed_time": "1 day, 21:20:40", "remaining_time": "20:41:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20700, "total_steps": 30076, "loss": 0.3915, "learning_rate": 2.6796259276649693e-05, "epoch": 1.3764441858532126, "percentage": 68.83, "elapsed_time": "1 day, 21:26:48", "remaining_time": "20:35:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20750, "total_steps": 30076, "loss": 0.3915, "learning_rate": 2.653963112553498e-05, "epoch": 1.3797689302634861, "percentage": 68.99, "elapsed_time": "1 day, 21:32:58", "remaining_time": "20:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20800, "total_steps": 30076, "loss": 0.3984, "learning_rate": 2.6283793036169603e-05, "epoch": 1.3830936746737594, "percentage": 69.16, "elapsed_time": "1 day, 21:39:08", "remaining_time": "20:21:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20850, "total_steps": 30076, "loss": 0.3679, "learning_rate": 2.6028753624270074e-05, "epoch": 1.386418419084033, "percentage": 69.32, "elapsed_time": "1 day, 21:45:18", "remaining_time": "20:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20900, "total_steps": 30076, "loss": 0.3808, "learning_rate": 2.5774521478656343e-05, "epoch": 1.3897431634943063, "percentage": 69.49, "elapsed_time": "1 day, 21:51:32", "remaining_time": "20:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20950, "total_steps": 30076, "loss": 0.3669, "learning_rate": 2.5521105160962473e-05, "epoch": 1.3930679079045798, "percentage": 69.66, "elapsed_time": "1 day, 21:58:00", "remaining_time": "20:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21000, "total_steps": 30076, "loss": 0.3882, "learning_rate": 2.52685132053484e-05, "epoch": 1.3963926523148533, "percentage": 69.82, "elapsed_time": "1 day, 22:04:19", "remaining_time": "19:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21050, "total_steps": 30076, "loss": 0.4083, "learning_rate": 2.501675411821241e-05, "epoch": 1.3997173967251269, "percentage": 69.99, "elapsed_time": "1 day, 22:10:48", "remaining_time": "19:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21100, "total_steps": 30076, "loss": 0.4103, "learning_rate": 2.4765836377904787e-05, "epoch": 1.4030421411354002, "percentage": 70.16, "elapsed_time": "1 day, 22:16:59", "remaining_time": "19:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21150, "total_steps": 30076, "loss": 0.3978, "learning_rate": 2.4515768434442215e-05, "epoch": 1.4063668855456737, "percentage": 70.32, "elapsed_time": "1 day, 22:23:22", "remaining_time": "19:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21200, "total_steps": 30076, "loss": 0.3907, "learning_rate": 2.4266558709223293e-05, "epoch": 1.4096916299559472, "percentage": 70.49, "elapsed_time": "1 day, 22:29:45", "remaining_time": "19:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21250, "total_steps": 30076, "loss": 0.4001, "learning_rate": 2.4018215594744835e-05, "epoch": 1.4130163743662205, "percentage": 70.65, "elapsed_time": "1 day, 22:35:51", "remaining_time": "19:21:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21300, "total_steps": 30076, "loss": 0.3897, "learning_rate": 2.377074745431931e-05, "epoch": 1.416341118776494, "percentage": 70.82, "elapsed_time": "1 day, 22:42:24", "remaining_time": "19:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21350, "total_steps": 30076, "loss": 0.3693, "learning_rate": 2.352416262179315e-05, "epoch": 1.4196658631867676, "percentage": 70.99, "elapsed_time": "1 day, 22:48:38", "remaining_time": "19:07:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21400, "total_steps": 30076, "loss": 0.3648, "learning_rate": 2.3278469401266178e-05, "epoch": 1.422990607597041, "percentage": 71.15, "elapsed_time": "1 day, 22:54:40", "remaining_time": "19:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21450, "total_steps": 30076, "loss": 0.3768, "learning_rate": 2.3033676066811845e-05, "epoch": 1.4263153520073144, "percentage": 71.32, "elapsed_time": "1 day, 23:00:45", "remaining_time": "18:54:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21500, "total_steps": 30076, "loss": 0.3326, "learning_rate": 2.2789790862198628e-05, "epoch": 1.429640096417588, "percentage": 71.49, "elapsed_time": "1 day, 23:06:50", "remaining_time": "18:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21550, "total_steps": 30076, "loss": 0.37, "learning_rate": 2.2546822000612495e-05, "epoch": 1.4329648408278612, "percentage": 71.65, "elapsed_time": "1 day, 23:13:03", "remaining_time": "18:40:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21600, "total_steps": 30076, "loss": 0.3777, "learning_rate": 2.2304777664380176e-05, "epoch": 1.4362895852381348, "percentage": 71.82, "elapsed_time": "1 day, 23:19:05", "remaining_time": "18:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21650, "total_steps": 30076, "loss": 0.3809, "learning_rate": 2.2063666004693695e-05, "epoch": 1.4396143296484083, "percentage": 71.98, "elapsed_time": "1 day, 23:25:05", "remaining_time": "18:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21700, "total_steps": 30076, "loss": 0.3746, "learning_rate": 2.182349514133583e-05, "epoch": 1.4429390740586818, "percentage": 72.15, "elapsed_time": "1 day, 23:31:16", "remaining_time": "18:20:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21750, "total_steps": 30076, "loss": 0.3536, "learning_rate": 2.1584273162406755e-05, "epoch": 1.4462638184689551, "percentage": 72.32, "elapsed_time": "1 day, 23:37:12", "remaining_time": "18:13:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21800, "total_steps": 30076, "loss": 0.3886, "learning_rate": 2.134600812405151e-05, "epoch": 1.4495885628792287, "percentage": 72.48, "elapsed_time": "1 day, 23:43:26", "remaining_time": "18:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21850, "total_steps": 30076, "loss": 0.3688, "learning_rate": 2.1108708050188825e-05, "epoch": 1.4529133072895022, "percentage": 72.65, "elapsed_time": "1 day, 23:49:38", "remaining_time": "18:00:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21900, "total_steps": 30076, "loss": 0.3716, "learning_rate": 2.0872380932240832e-05, "epoch": 1.4562380516997755, "percentage": 72.82, "elapsed_time": "1 day, 23:55:57", "remaining_time": "17:53:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21950, "total_steps": 30076, "loss": 0.3939, "learning_rate": 2.063703472886402e-05, "epoch": 1.459562796110049, "percentage": 72.98, "elapsed_time": "2 days, 0:02:03", "remaining_time": "17:46:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22000, "total_steps": 30076, "loss": 0.361, "learning_rate": 2.0402677365681112e-05, "epoch": 1.4628875405203225, "percentage": 73.15, "elapsed_time": "2 days, 0:08:26", "remaining_time": "17:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22050, "total_steps": 30076, "loss": 0.4137, "learning_rate": 2.0169316735014236e-05, "epoch": 1.466212284930596, "percentage": 73.31, "elapsed_time": "2 days, 0:14:33", "remaining_time": "17:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22100, "total_steps": 30076, "loss": 0.4188, "learning_rate": 1.99369606956191e-05, "epoch": 1.4695370293408694, "percentage": 73.48, "elapsed_time": "2 days, 0:20:58", "remaining_time": "17:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22150, "total_steps": 30076, "loss": 0.373, "learning_rate": 1.9705617072420392e-05, "epoch": 1.472861773751143, "percentage": 73.65, "elapsed_time": "2 days, 0:27:01", "remaining_time": "17:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22200, "total_steps": 30076, "loss": 0.3778, "learning_rate": 1.9475293656248182e-05, "epoch": 1.4761865181614162, "percentage": 73.81, "elapsed_time": "2 days, 0:33:25", "remaining_time": "17:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22250, "total_steps": 30076, "loss": 0.4243, "learning_rate": 1.9245998203575593e-05, "epoch": 1.4795112625716897, "percentage": 73.98, "elapsed_time": "2 days, 0:39:35", "remaining_time": "17:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22300, "total_steps": 30076, "loss": 0.344, "learning_rate": 1.9017738436257655e-05, "epoch": 1.4828360069819633, "percentage": 74.15, "elapsed_time": "2 days, 0:45:41", "remaining_time": "17:00:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22350, "total_steps": 30076, "loss": 0.3771, "learning_rate": 1.879052204127114e-05, "epoch": 1.4861607513922368, "percentage": 74.31, "elapsed_time": "2 days, 0:52:17", "remaining_time": "16:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22400, "total_steps": 30076, "loss": 0.3922, "learning_rate": 1.8564356670455767e-05, "epoch": 1.48948549580251, "percentage": 74.48, "elapsed_time": "2 days, 0:58:34", "remaining_time": "16:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22450, "total_steps": 30076, "loss": 0.3877, "learning_rate": 1.8339249940256492e-05, "epoch": 1.4928102402127836, "percentage": 74.64, "elapsed_time": "2 days, 1:04:58", "remaining_time": "16:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22500, "total_steps": 30076, "loss": 0.3898, "learning_rate": 1.8115209431467074e-05, "epoch": 1.4961349846230572, "percentage": 74.81, "elapsed_time": "2 days, 1:11:35", "remaining_time": "16:33:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22550, "total_steps": 30076, "loss": 0.4022, "learning_rate": 1.7892242688974664e-05, "epoch": 1.4994597290333305, "percentage": 74.98, "elapsed_time": "2 days, 1:17:52", "remaining_time": "16:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22600, "total_steps": 30076, "loss": 0.3609, "learning_rate": 1.767035722150582e-05, "epoch": 1.502784473443604, "percentage": 75.14, "elapsed_time": "2 days, 1:24:06", "remaining_time": "16:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22650, "total_steps": 30076, "loss": 0.3637, "learning_rate": 1.7449560501373567e-05, "epoch": 1.5061092178538775, "percentage": 75.31, "elapsed_time": "2 days, 1:30:07", "remaining_time": "16:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22700, "total_steps": 30076, "loss": 0.3746, "learning_rate": 1.7229859964225868e-05, "epoch": 1.509433962264151, "percentage": 75.48, "elapsed_time": "2 days, 1:36:23", "remaining_time": "16:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22750, "total_steps": 30076, "loss": 0.4118, "learning_rate": 1.7011263008795075e-05, "epoch": 1.5127587066744244, "percentage": 75.64, "elapsed_time": "2 days, 1:42:33", "remaining_time": "16:00:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22800, "total_steps": 30076, "loss": 0.3622, "learning_rate": 1.679377699664884e-05, "epoch": 1.5160834510846979, "percentage": 75.81, "elapsed_time": "2 days, 1:48:53", "remaining_time": "15:53:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22850, "total_steps": 30076, "loss": 0.3815, "learning_rate": 1.657740925194225e-05, "epoch": 1.5194081954949712, "percentage": 75.97, "elapsed_time": "2 days, 1:55:23", "remaining_time": "15:47:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22900, "total_steps": 30076, "loss": 0.3837, "learning_rate": 1.6362167061171063e-05, "epoch": 1.5227329399052447, "percentage": 76.14, "elapsed_time": "2 days, 2:01:46", "remaining_time": "15:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22950, "total_steps": 30076, "loss": 0.3932, "learning_rate": 1.614805767292642e-05, "epoch": 1.5260576843155182, "percentage": 76.31, "elapsed_time": "2 days, 2:08:23", "remaining_time": "15:34:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23000, "total_steps": 30076, "loss": 0.3485, "learning_rate": 1.5935088297650674e-05, "epoch": 1.5293824287257918, "percentage": 76.47, "elapsed_time": "2 days, 2:14:50", "remaining_time": "15:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23050, "total_steps": 30076, "loss": 0.3887, "learning_rate": 1.5723266107394653e-05, "epoch": 1.5327071731360653, "percentage": 76.64, "elapsed_time": "2 days, 2:20:59", "remaining_time": "15:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23100, "total_steps": 30076, "loss": 0.3908, "learning_rate": 1.551259823557602e-05, "epoch": 1.5360319175463386, "percentage": 76.81, "elapsed_time": "2 days, 2:27:01", "remaining_time": "15:14:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23150, "total_steps": 30076, "loss": 0.4156, "learning_rate": 1.530309177673912e-05, "epoch": 1.5393566619566121, "percentage": 76.97, "elapsed_time": "2 days, 2:33:27", "remaining_time": "15:07:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23200, "total_steps": 30076, "loss": 0.3439, "learning_rate": 1.509475378631603e-05, "epoch": 1.5426814063668854, "percentage": 77.14, "elapsed_time": "2 days, 2:39:40", "remaining_time": "15:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23250, "total_steps": 30076, "loss": 0.3763, "learning_rate": 1.4887591280389007e-05, "epoch": 1.546006150777159, "percentage": 77.3, "elapsed_time": "2 days, 2:45:39", "remaining_time": "14:54:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23300, "total_steps": 30076, "loss": 0.4004, "learning_rate": 1.468161123545413e-05, "epoch": 1.5493308951874325, "percentage": 77.47, "elapsed_time": "2 days, 2:52:00", "remaining_time": "14:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23350, "total_steps": 30076, "loss": 0.3433, "learning_rate": 1.4476820588186412e-05, "epoch": 1.552655639597706, "percentage": 77.64, "elapsed_time": "2 days, 2:58:20", "remaining_time": "14:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23400, "total_steps": 30076, "loss": 0.3838, "learning_rate": 1.4273226235206178e-05, "epoch": 1.5559803840079793, "percentage": 77.8, "elapsed_time": "2 days, 3:04:23", "remaining_time": "14:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23450, "total_steps": 30076, "loss": 0.3627, "learning_rate": 1.4070835032846852e-05, "epoch": 1.5593051284182529, "percentage": 77.97, "elapsed_time": "2 days, 3:10:48", "remaining_time": "14:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23500, "total_steps": 30076, "loss": 0.3698, "learning_rate": 1.3869653796923993e-05, "epoch": 1.5626298728285262, "percentage": 78.14, "elapsed_time": "2 days, 3:17:13", "remaining_time": "14:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23550, "total_steps": 30076, "loss": 0.3827, "learning_rate": 1.3669689302505778e-05, "epoch": 1.5659546172387997, "percentage": 78.3, "elapsed_time": "2 days, 3:23:25", "remaining_time": "14:14:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23600, "total_steps": 30076, "loss": 0.363, "learning_rate": 1.3470948283684925e-05, "epoch": 1.5692793616490732, "percentage": 78.47, "elapsed_time": "2 days, 3:29:09", "remaining_time": "14:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23650, "total_steps": 30076, "loss": 0.3504, "learning_rate": 1.3273437433351787e-05, "epoch": 1.5726041060593468, "percentage": 78.63, "elapsed_time": "2 days, 3:35:17", "remaining_time": "14:01:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23700, "total_steps": 30076, "loss": 0.4031, "learning_rate": 1.307716340296904e-05, "epoch": 1.5759288504696203, "percentage": 78.8, "elapsed_time": "2 days, 3:41:54", "remaining_time": "13:54:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23750, "total_steps": 30076, "loss": 0.3945, "learning_rate": 1.2882132802347647e-05, "epoch": 1.5792535948798936, "percentage": 78.97, "elapsed_time": "2 days, 3:48:06", "remaining_time": "13:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23800, "total_steps": 30076, "loss": 0.3742, "learning_rate": 1.268835219942433e-05, "epoch": 1.5825783392901671, "percentage": 79.13, "elapsed_time": "2 days, 3:54:42", "remaining_time": "13:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23850, "total_steps": 30076, "loss": 0.412, "learning_rate": 1.2495828120040288e-05, "epoch": 1.5859030837004404, "percentage": 79.3, "elapsed_time": "2 days, 4:00:51", "remaining_time": "13:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23900, "total_steps": 30076, "loss": 0.3863, "learning_rate": 1.23045670477215e-05, "epoch": 1.589227828110714, "percentage": 79.47, "elapsed_time": "2 days, 4:07:13", "remaining_time": "13:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23950, "total_steps": 30076, "loss": 0.3391, "learning_rate": 1.2114575423460333e-05, "epoch": 1.5925525725209875, "percentage": 79.63, "elapsed_time": "2 days, 4:13:22", "remaining_time": "13:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24000, "total_steps": 30076, "loss": 0.3796, "learning_rate": 1.1925859645498722e-05, "epoch": 1.595877316931261, "percentage": 79.8, "elapsed_time": "2 days, 4:19:26", "remaining_time": "13:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24050, "total_steps": 30076, "loss": 0.4019, "learning_rate": 1.1738426069112573e-05, "epoch": 1.5992020613415345, "percentage": 79.96, "elapsed_time": "2 days, 4:25:34", "remaining_time": "13:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24100, "total_steps": 30076, "loss": 0.3652, "learning_rate": 1.1552281006397819e-05, "epoch": 1.6025268057518078, "percentage": 80.13, "elapsed_time": "2 days, 4:31:34", "remaining_time": "13:01:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24150, "total_steps": 30076, "loss": 0.3499, "learning_rate": 1.1367430726057887e-05, "epoch": 1.6058515501620811, "percentage": 80.3, "elapsed_time": "2 days, 4:37:31", "remaining_time": "12:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24200, "total_steps": 30076, "loss": 0.3619, "learning_rate": 1.1183881453192479e-05, "epoch": 1.6091762945723547, "percentage": 80.46, "elapsed_time": "2 days, 4:43:30", "remaining_time": "12:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24250, "total_steps": 30076, "loss": 0.3463, "learning_rate": 1.1001639369088018e-05, "epoch": 1.6125010389826282, "percentage": 80.63, "elapsed_time": "2 days, 4:49:50", "remaining_time": "12:41:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24300, "total_steps": 30076, "loss": 0.3765, "learning_rate": 1.082071061100945e-05, "epoch": 1.6158257833929017, "percentage": 80.8, "elapsed_time": "2 days, 4:56:26", "remaining_time": "12:35:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24350, "total_steps": 30076, "loss": 0.3561, "learning_rate": 1.0641101271993614e-05, "epoch": 1.6191505278031753, "percentage": 80.96, "elapsed_time": "2 days, 5:02:30", "remaining_time": "12:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24400, "total_steps": 30076, "loss": 0.3863, "learning_rate": 1.0462817400643959e-05, "epoch": 1.6224752722134486, "percentage": 81.13, "elapsed_time": "2 days, 5:08:23", "remaining_time": "12:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24450, "total_steps": 30076, "loss": 0.3678, "learning_rate": 1.0285865000926925e-05, "epoch": 1.625800016623722, "percentage": 81.29, "elapsed_time": "2 days, 5:14:16", "remaining_time": "12:15:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24500, "total_steps": 30076, "loss": 0.3705, "learning_rate": 1.0110250031969709e-05, "epoch": 1.6291247610339954, "percentage": 81.46, "elapsed_time": "2 days, 5:20:04", "remaining_time": "12:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24550, "total_steps": 30076, "loss": 0.3429, "learning_rate": 9.935978407859624e-06, "epoch": 1.632449505444269, "percentage": 81.63, "elapsed_time": "2 days, 5:26:39", "remaining_time": "12:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24600, "total_steps": 30076, "loss": 0.3985, "learning_rate": 9.763055997444897e-06, "epoch": 1.6357742498545425, "percentage": 81.79, "elapsed_time": "2 days, 5:32:49", "remaining_time": "11:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24650, "total_steps": 30076, "loss": 0.3575, "learning_rate": 9.591488624137023e-06, "epoch": 1.639098994264816, "percentage": 81.96, "elapsed_time": "2 days, 5:39:25", "remaining_time": "11:48:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24700, "total_steps": 30076, "loss": 0.3721, "learning_rate": 9.421282065714676e-06, "epoch": 1.6424237386750895, "percentage": 82.13, "elapsed_time": "2 days, 5:45:21", "remaining_time": "11:42:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24750, "total_steps": 30076, "loss": 0.3741, "learning_rate": 9.25244205412915e-06, "epoch": 1.6457484830853628, "percentage": 82.29, "elapsed_time": "2 days, 5:51:37", "remaining_time": "11:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24800, "total_steps": 30076, "loss": 0.3259, "learning_rate": 9.08497427531128e-06, "epoch": 1.6490732274956361, "percentage": 82.46, "elapsed_time": "2 days, 5:57:50", "remaining_time": "11:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24850, "total_steps": 30076, "loss": 0.396, "learning_rate": 8.91888436897997e-06, "epoch": 1.6523979719059096, "percentage": 82.62, "elapsed_time": "2 days, 6:03:57", "remaining_time": "11:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24900, "total_steps": 30076, "loss": 0.3445, "learning_rate": 8.754177928452328e-06, "epoch": 1.6557227163161832, "percentage": 82.79, "elapsed_time": "2 days, 6:09:53", "remaining_time": "11:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24950, "total_steps": 30076, "loss": 0.387, "learning_rate": 8.590860500455217e-06, "epoch": 1.6590474607264567, "percentage": 82.96, "elapsed_time": "2 days, 6:15:56", "remaining_time": "11:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25000, "total_steps": 30076, "loss": 0.3951, "learning_rate": 8.428937584938496e-06, "epoch": 1.6623722051367302, "percentage": 83.12, "elapsed_time": "2 days, 6:22:24", "remaining_time": "11:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25050, "total_steps": 30076, "loss": 0.3673, "learning_rate": 8.268414634889848e-06, "epoch": 1.6656969495470035, "percentage": 83.29, "elapsed_time": "2 days, 6:28:56", "remaining_time": "10:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25100, "total_steps": 30076, "loss": 0.3975, "learning_rate": 8.109297056151067e-06, "epoch": 1.669021693957277, "percentage": 83.46, "elapsed_time": "2 days, 6:34:57", "remaining_time": "10:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25150, "total_steps": 30076, "loss": 0.3967, "learning_rate": 7.951590207236038e-06, "epoch": 1.6723464383675504, "percentage": 83.62, "elapsed_time": "2 days, 6:41:16", "remaining_time": "10:42:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25200, "total_steps": 30076, "loss": 0.3482, "learning_rate": 7.79529939915029e-06, "epoch": 1.675671182777824, "percentage": 83.79, "elapsed_time": "2 days, 6:47:28", "remaining_time": "10:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25250, "total_steps": 30076, "loss": 0.3693, "learning_rate": 7.640429895212164e-06, "epoch": 1.6789959271880974, "percentage": 83.95, "elapsed_time": "2 days, 6:53:33", "remaining_time": "10:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25300, "total_steps": 30076, "loss": 0.325, "learning_rate": 7.486986910875499e-06, "epoch": 1.682320671598371, "percentage": 84.12, "elapsed_time": "2 days, 6:59:43", "remaining_time": "10:22:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25350, "total_steps": 30076, "loss": 0.3634, "learning_rate": 7.3349756135540235e-06, "epoch": 1.6856454160086445, "percentage": 84.29, "elapsed_time": "2 days, 7:05:38", "remaining_time": "10:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25400, "total_steps": 30076, "loss": 0.3927, "learning_rate": 7.184401122447398e-06, "epoch": 1.6889701604189178, "percentage": 84.45, "elapsed_time": "2 days, 7:11:16", "remaining_time": "10:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25450, "total_steps": 30076, "loss": 0.3676, "learning_rate": 7.035268508368697e-06, "epoch": 1.692294904829191, "percentage": 84.62, "elapsed_time": "2 days, 7:17:34", "remaining_time": "10:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25500, "total_steps": 30076, "loss": 0.3897, "learning_rate": 6.887582793573727e-06, "epoch": 1.6956196492394646, "percentage": 84.79, "elapsed_time": "2 days, 7:23:54", "remaining_time": "9:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25550, "total_steps": 30076, "loss": 0.3922, "learning_rate": 6.741348951591908e-06, "epoch": 1.6989443936497381, "percentage": 84.95, "elapsed_time": "2 days, 7:30:15", "remaining_time": "9:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25600, "total_steps": 30076, "loss": 0.374, "learning_rate": 6.596571907058707e-06, "epoch": 1.7022691380600117, "percentage": 85.12, "elapsed_time": "2 days, 7:36:28", "remaining_time": "9:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25650, "total_steps": 30076, "loss": 0.4181, "learning_rate": 6.453256535549846e-06, "epoch": 1.7055938824702852, "percentage": 85.28, "elapsed_time": "2 days, 7:42:38", "remaining_time": "9:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25700, "total_steps": 30076, "loss": 0.3611, "learning_rate": 6.31140766341713e-06, "epoch": 1.7089186268805585, "percentage": 85.45, "elapsed_time": "2 days, 7:49:07", "remaining_time": "9:30:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25750, "total_steps": 30076, "loss": 0.3328, "learning_rate": 6.1710300676258385e-06, "epoch": 1.712243371290832, "percentage": 85.62, "elapsed_time": "2 days, 7:55:07", "remaining_time": "9:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25800, "total_steps": 30076, "loss": 0.3704, "learning_rate": 6.032128475593924e-06, "epoch": 1.7155681157011053, "percentage": 85.78, "elapsed_time": "2 days, 8:01:10", "remaining_time": "9:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25850, "total_steps": 30076, "loss": 0.3486, "learning_rate": 5.894707565032776e-06, "epoch": 1.7188928601113789, "percentage": 85.95, "elapsed_time": "2 days, 8:07:33", "remaining_time": "9:10:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25900, "total_steps": 30076, "loss": 0.3668, "learning_rate": 5.758771963789722e-06, "epoch": 1.7222176045216524, "percentage": 86.12, "elapsed_time": "2 days, 8:13:56", "remaining_time": "9:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25950, "total_steps": 30076, "loss": 0.3143, "learning_rate": 5.6243262496921245e-06, "epoch": 1.725542348931926, "percentage": 86.28, "elapsed_time": "2 days, 8:20:04", "remaining_time": "8:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26000, "total_steps": 30076, "loss": 0.3452, "learning_rate": 5.4913749503932575e-06, "epoch": 1.7288670933421995, "percentage": 86.45, "elapsed_time": "2 days, 8:26:20", "remaining_time": "8:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26050, "total_steps": 30076, "loss": 0.3903, "learning_rate": 5.359922543219848e-06, "epoch": 1.7321918377524728, "percentage": 86.61, "elapsed_time": "2 days, 8:33:02", "remaining_time": "8:44:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26100, "total_steps": 30076, "loss": 0.3691, "learning_rate": 5.229973455021231e-06, "epoch": 1.7355165821627463, "percentage": 86.78, "elapsed_time": "2 days, 8:39:09", "remaining_time": "8:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26150, "total_steps": 30076, "loss": 0.3174, "learning_rate": 5.101532062020325e-06, "epoch": 1.7388413265730196, "percentage": 86.95, "elapsed_time": "2 days, 8:45:07", "remaining_time": "8:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26200, "total_steps": 30076, "loss": 0.3693, "learning_rate": 4.974602689666252e-06, "epoch": 1.7421660709832931, "percentage": 87.11, "elapsed_time": "2 days, 8:51:16", "remaining_time": "8:24:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26250, "total_steps": 30076, "loss": 0.3869, "learning_rate": 4.8491896124886416e-06, "epoch": 1.7454908153935667, "percentage": 87.28, "elapsed_time": "2 days, 8:57:12", "remaining_time": "8:18:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26300, "total_steps": 30076, "loss": 0.3925, "learning_rate": 4.725297053953692e-06, "epoch": 1.7488155598038402, "percentage": 87.45, "elapsed_time": "2 days, 9:03:15", "remaining_time": "8:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26350, "total_steps": 30076, "loss": 0.3563, "learning_rate": 4.602929186321947e-06, "epoch": 1.7521403042141135, "percentage": 87.61, "elapsed_time": "2 days, 9:09:34", "remaining_time": "8:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26400, "total_steps": 30076, "loss": 0.4169, "learning_rate": 4.48209013050781e-06, "epoch": 1.755465048624387, "percentage": 87.78, "elapsed_time": "2 days, 9:15:21", "remaining_time": "7:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26450, "total_steps": 30076, "loss": 0.363, "learning_rate": 4.362783955940719e-06, "epoch": 1.7587897930346603, "percentage": 87.94, "elapsed_time": "2 days, 9:21:23", "remaining_time": "7:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26500, "total_steps": 30076, "loss": 0.3572, "learning_rate": 4.245014680428117e-06, "epoch": 1.7621145374449338, "percentage": 88.11, "elapsed_time": "2 days, 9:27:28", "remaining_time": "7:45:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26550, "total_steps": 30076, "loss": 0.3497, "learning_rate": 4.128786270020174e-06, "epoch": 1.7654392818552074, "percentage": 88.28, "elapsed_time": "2 days, 9:33:49", "remaining_time": "7:38:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26600, "total_steps": 30076, "loss": 0.3702, "learning_rate": 4.014102638876205e-06, "epoch": 1.768764026265481, "percentage": 88.44, "elapsed_time": "2 days, 9:40:03", "remaining_time": "7:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26650, "total_steps": 30076, "loss": 0.3662, "learning_rate": 3.900967649132847e-06, "epoch": 1.7720887706757544, "percentage": 88.61, "elapsed_time": "2 days, 9:46:46", "remaining_time": "7:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26700, "total_steps": 30076, "loss": 0.3643, "learning_rate": 3.789385110774013e-06, "epoch": 1.7754135150860277, "percentage": 88.78, "elapsed_time": "2 days, 9:52:51", "remaining_time": "7:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26750, "total_steps": 30076, "loss": 0.3834, "learning_rate": 3.679358781502562e-06, "epoch": 1.7787382594963013, "percentage": 88.94, "elapsed_time": "2 days, 9:59:06", "remaining_time": "7:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26800, "total_steps": 30076, "loss": 0.3632, "learning_rate": 3.5708923666137927e-06, "epoch": 1.7820630039065746, "percentage": 89.11, "elapsed_time": "2 days, 10:05:15", "remaining_time": "7:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26850, "total_steps": 30076, "loss": 0.3702, "learning_rate": 3.4639895188706195e-06, "epoch": 1.785387748316848, "percentage": 89.27, "elapsed_time": "2 days, 10:11:49", "remaining_time": "6:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26900, "total_steps": 30076, "loss": 0.3397, "learning_rate": 3.358653838380571e-06, "epoch": 1.7887124927271216, "percentage": 89.44, "elapsed_time": "2 days, 10:18:20", "remaining_time": "6:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26950, "total_steps": 30076, "loss": 0.3762, "learning_rate": 3.254888872474593e-06, "epoch": 1.7920372371373952, "percentage": 89.61, "elapsed_time": "2 days, 10:24:44", "remaining_time": "6:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27000, "total_steps": 30076, "loss": 0.3425, "learning_rate": 3.1526981155875156e-06, "epoch": 1.7953619815476687, "percentage": 89.77, "elapsed_time": "2 days, 10:30:58", "remaining_time": "6:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27050, "total_steps": 30076, "loss": 0.3708, "learning_rate": 3.0520850091404263e-06, "epoch": 1.798686725957942, "percentage": 89.94, "elapsed_time": "2 days, 10:37:18", "remaining_time": "6:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27100, "total_steps": 30076, "loss": 0.3675, "learning_rate": 2.9530529414247608e-06, "epoch": 1.8020114703682153, "percentage": 90.11, "elapsed_time": "2 days, 10:43:30", "remaining_time": "6:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27150, "total_steps": 30076, "loss": 0.3647, "learning_rate": 2.8556052474881967e-06, "epoch": 1.8053362147784888, "percentage": 90.27, "elapsed_time": "2 days, 10:50:00", "remaining_time": "6:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27200, "total_steps": 30076, "loss": 0.3456, "learning_rate": 2.7597452090223354e-06, "epoch": 1.8086609591887624, "percentage": 90.44, "elapsed_time": "2 days, 10:56:06", "remaining_time": "6:13:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27250, "total_steps": 30076, "loss": 0.3746, "learning_rate": 2.6654760542521917e-06, "epoch": 1.8119857035990359, "percentage": 90.6, "elapsed_time": "2 days, 11:02:43", "remaining_time": "6:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27300, "total_steps": 30076, "loss": 0.3798, "learning_rate": 2.572800957827476e-06, "epoch": 1.8153104480093094, "percentage": 90.77, "elapsed_time": "2 days, 11:09:01", "remaining_time": "6:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27350, "total_steps": 30076, "loss": 0.3713, "learning_rate": 2.4817230407156946e-06, "epoch": 1.8186351924195827, "percentage": 90.94, "elapsed_time": "2 days, 11:15:11", "remaining_time": "5:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27400, "total_steps": 30076, "loss": 0.3976, "learning_rate": 2.3922453700970295e-06, "epoch": 1.8219599368298562, "percentage": 91.1, "elapsed_time": "2 days, 11:21:23", "remaining_time": "5:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27450, "total_steps": 30076, "loss": 0.3788, "learning_rate": 2.3043709592610485e-06, "epoch": 1.8252846812401295, "percentage": 91.27, "elapsed_time": "2 days, 11:27:17", "remaining_time": "5:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27500, "total_steps": 30076, "loss": 0.3672, "learning_rate": 2.2181027675052534e-06, "epoch": 1.828609425650403, "percentage": 91.44, "elapsed_time": "2 days, 11:33:27", "remaining_time": "5:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27550, "total_steps": 30076, "loss": 0.3382, "learning_rate": 2.133443700035387e-06, "epoch": 1.8319341700606766, "percentage": 91.6, "elapsed_time": "2 days, 11:39:26", "remaining_time": "5:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27600, "total_steps": 30076, "loss": 0.4051, "learning_rate": 2.0503966078676217e-06, "epoch": 1.8352589144709501, "percentage": 91.77, "elapsed_time": "2 days, 11:45:54", "remaining_time": "5:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27650, "total_steps": 30076, "loss": 0.3855, "learning_rate": 1.9689642877325165e-06, "epoch": 1.8385836588812237, "percentage": 91.93, "elapsed_time": "2 days, 11:52:05", "remaining_time": "5:15:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27700, "total_steps": 30076, "loss": 0.366, "learning_rate": 1.8891494819808841e-06, "epoch": 1.841908403291497, "percentage": 92.1, "elapsed_time": "2 days, 11:58:32", "remaining_time": "5:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27750, "total_steps": 30076, "loss": 0.3469, "learning_rate": 1.8109548784913887e-06, "epoch": 1.8452331477017703, "percentage": 92.27, "elapsed_time": "2 days, 12:04:55", "remaining_time": "5:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27800, "total_steps": 30076, "loss": 0.3724, "learning_rate": 1.7343831105800511e-06, "epoch": 1.8485578921120438, "percentage": 92.43, "elapsed_time": "2 days, 12:11:01", "remaining_time": "4:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27850, "total_steps": 30076, "loss": 0.353, "learning_rate": 1.6594367569115532e-06, "epoch": 1.8518826365223173, "percentage": 92.6, "elapsed_time": "2 days, 12:17:26", "remaining_time": "4:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27900, "total_steps": 30076, "loss": 0.3689, "learning_rate": 1.5861183414124403e-06, "epoch": 1.8552073809325909, "percentage": 92.76, "elapsed_time": "2 days, 12:24:02", "remaining_time": "4:42:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27950, "total_steps": 30076, "loss": 0.3341, "learning_rate": 1.514430333186062e-06, "epoch": 1.8585321253428644, "percentage": 92.93, "elapsed_time": "2 days, 12:29:57", "remaining_time": "4:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28000, "total_steps": 30076, "loss": 0.3709, "learning_rate": 1.4443751464294664e-06, "epoch": 1.8618568697531377, "percentage": 93.1, "elapsed_time": "2 days, 12:36:15", "remaining_time": "4:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28050, "total_steps": 30076, "loss": 0.3433, "learning_rate": 1.3759551403520643e-06, "epoch": 1.8651816141634112, "percentage": 93.26, "elapsed_time": "2 days, 12:42:14", "remaining_time": "4:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28100, "total_steps": 30076, "loss": 0.3337, "learning_rate": 1.3091726190962329e-06, "epoch": 1.8685063585736845, "percentage": 93.43, "elapsed_time": "2 days, 12:48:17", "remaining_time": "4:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28150, "total_steps": 30076, "loss": 0.3475, "learning_rate": 1.2440298316596654e-06, "epoch": 1.871831102983958, "percentage": 93.6, "elapsed_time": "2 days, 12:54:16", "remaining_time": "4:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28200, "total_steps": 30076, "loss": 0.3441, "learning_rate": 1.18052897181965e-06, "epoch": 1.8751558473942316, "percentage": 93.76, "elapsed_time": "2 days, 13:00:28", "remaining_time": "4:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28250, "total_steps": 30076, "loss": 0.3793, "learning_rate": 1.1186721780592102e-06, "epoch": 1.878480591804505, "percentage": 93.93, "elapsed_time": "2 days, 13:06:46", "remaining_time": "3:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28300, "total_steps": 30076, "loss": 0.3656, "learning_rate": 1.0584615334950643e-06, "epoch": 1.8818053362147786, "percentage": 94.09, "elapsed_time": "2 days, 13:13:09", "remaining_time": "3:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28350, "total_steps": 30076, "loss": 0.3368, "learning_rate": 9.998990658074914e-07, "epoch": 1.885130080625052, "percentage": 94.26, "elapsed_time": "2 days, 13:19:09", "remaining_time": "3:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28400, "total_steps": 30076, "loss": 0.3631, "learning_rate": 9.429867471720255e-07, "epoch": 1.8884548250353252, "percentage": 94.43, "elapsed_time": "2 days, 13:25:26", "remaining_time": "3:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28450, "total_steps": 30076, "loss": 0.3569, "learning_rate": 8.877264941930586e-07, "epoch": 1.8917795694455988, "percentage": 94.59, "elapsed_time": "2 days, 13:31:29", "remaining_time": "3:30:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28500, "total_steps": 30076, "loss": 0.4227, "learning_rate": 8.341201678392974e-07, "epoch": 1.8951043138558723, "percentage": 94.76, "elapsed_time": "2 days, 13:37:37", "remaining_time": "3:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28550, "total_steps": 30076, "loss": 0.3959, "learning_rate": 7.821695733810641e-07, "epoch": 1.8984290582661458, "percentage": 94.93, "elapsed_time": "2 days, 13:44:00", "remaining_time": "3:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28600, "total_steps": 30076, "loss": 0.3363, "learning_rate": 7.318764603295447e-07, "epoch": 1.9017538026764194, "percentage": 95.09, "elapsed_time": "2 days, 13:50:07", "remaining_time": "3:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28650, "total_steps": 30076, "loss": 0.395, "learning_rate": 6.832425223778304e-07, "epoch": 1.9050785470866927, "percentage": 95.26, "elapsed_time": "2 days, 13:56:13", "remaining_time": "3:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28700, "total_steps": 30076, "loss": 0.352, "learning_rate": 6.362693973439193e-07, "epoch": 1.9084032914969662, "percentage": 95.42, "elapsed_time": "2 days, 14:02:30", "remaining_time": "2:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28750, "total_steps": 30076, "loss": 0.3362, "learning_rate": 5.909586671155098e-07, "epoch": 1.9117280359072395, "percentage": 95.59, "elapsed_time": "2 days, 14:08:48", "remaining_time": "2:51:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28800, "total_steps": 30076, "loss": 0.3586, "learning_rate": 5.47311857596794e-07, "epoch": 1.915052780317513, "percentage": 95.76, "elapsed_time": "2 days, 14:15:00", "remaining_time": "2:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28850, "total_steps": 30076, "loss": 0.3757, "learning_rate": 5.05330438657009e-07, "epoch": 1.9183775247277866, "percentage": 95.92, "elapsed_time": "2 days, 14:21:34", "remaining_time": "2:39:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28900, "total_steps": 30076, "loss": 0.3783, "learning_rate": 4.6501582408096657e-07, "epoch": 1.92170226913806, "percentage": 96.09, "elapsed_time": "2 days, 14:27:45", "remaining_time": "2:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28950, "total_steps": 30076, "loss": 0.3516, "learning_rate": 4.263693715214456e-07, "epoch": 1.9250270135483336, "percentage": 96.26, "elapsed_time": "2 days, 14:33:48", "remaining_time": "2:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29000, "total_steps": 30076, "loss": 0.3414, "learning_rate": 3.893923824534629e-07, "epoch": 1.928351757958607, "percentage": 96.42, "elapsed_time": "2 days, 14:39:35", "remaining_time": "2:19:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29050, "total_steps": 30076, "loss": 0.3867, "learning_rate": 3.5408610213043536e-07, "epoch": 1.9316765023688804, "percentage": 96.59, "elapsed_time": "2 days, 14:45:34", "remaining_time": "2:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29100, "total_steps": 30076, "loss": 0.3588, "learning_rate": 3.204517195422696e-07, "epoch": 1.9350012467791537, "percentage": 96.75, "elapsed_time": "2 days, 14:51:45", "remaining_time": "2:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29150, "total_steps": 30076, "loss": 0.3816, "learning_rate": 2.8849036737528813e-07, "epoch": 1.9383259911894273, "percentage": 96.92, "elapsed_time": "2 days, 14:57:45", "remaining_time": "2:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29200, "total_steps": 30076, "loss": 0.3547, "learning_rate": 2.5820312197411543e-07, "epoch": 1.9416507355997008, "percentage": 97.09, "elapsed_time": "2 days, 15:03:55", "remaining_time": "1:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29250, "total_steps": 30076, "loss": 0.3763, "learning_rate": 2.2959100330541273e-07, "epoch": 1.9449754800099743, "percentage": 97.25, "elapsed_time": "2 days, 15:10:16", "remaining_time": "1:47:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29300, "total_steps": 30076, "loss": 0.3524, "learning_rate": 2.0265497492352735e-07, "epoch": 1.9483002244202476, "percentage": 97.42, "elapsed_time": "2 days, 15:16:42", "remaining_time": "1:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29350, "total_steps": 30076, "loss": 0.3532, "learning_rate": 1.7739594393805793e-07, "epoch": 1.9516249688305212, "percentage": 97.59, "elapsed_time": "2 days, 15:23:06", "remaining_time": "1:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29400, "total_steps": 30076, "loss": 0.3787, "learning_rate": 1.538147609832896e-07, "epoch": 1.9549497132407945, "percentage": 97.75, "elapsed_time": "2 days, 15:29:59", "remaining_time": "1:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29450, "total_steps": 30076, "loss": 0.3813, "learning_rate": 1.3191222018956174e-07, "epoch": 1.958274457651068, "percentage": 97.92, "elapsed_time": "2 days, 15:36:02", "remaining_time": "1:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29500, "total_steps": 30076, "loss": 0.3346, "learning_rate": 1.1168905915652228e-07, "epoch": 1.9615992020613415, "percentage": 98.08, "elapsed_time": "2 days, 15:42:06", "remaining_time": "1:14:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29550, "total_steps": 30076, "loss": 0.3695, "learning_rate": 9.314595892827016e-08, "epoch": 1.964923946471615, "percentage": 98.25, "elapsed_time": "2 days, 15:48:28", "remaining_time": "1:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29600, "total_steps": 30076, "loss": 0.3579, "learning_rate": 7.628354397045123e-08, "epoch": 1.9682486908818886, "percentage": 98.42, "elapsed_time": "2 days, 15:54:44", "remaining_time": "1:01:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29650, "total_steps": 30076, "loss": 0.3449, "learning_rate": 6.110238214919739e-08, "epoch": 1.971573435292162, "percentage": 98.58, "elapsed_time": "2 days, 16:00:45", "remaining_time": "0:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29700, "total_steps": 30076, "loss": 0.3598, "learning_rate": 4.760298471201963e-08, "epoch": 1.9748981797024354, "percentage": 98.75, "elapsed_time": "2 days, 16:06:57", "remaining_time": "0:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29750, "total_steps": 30076, "loss": 0.3437, "learning_rate": 3.5785806270599575e-08, "epoch": 1.9782229241127087, "percentage": 98.92, "elapsed_time": "2 days, 16:12:53", "remaining_time": "0:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29800, "total_steps": 30076, "loss": 0.361, "learning_rate": 2.565124478545733e-08, "epoch": 1.9815476685229823, "percentage": 99.08, "elapsed_time": "2 days, 16:19:30", "remaining_time": "0:35:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29850, "total_steps": 30076, "loss": 0.3668, "learning_rate": 1.719964155256215e-08, "epoch": 1.9848724129332558, "percentage": 99.25, "elapsed_time": "2 days, 16:25:40", "remaining_time": "0:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29900, "total_steps": 30076, "loss": 0.3647, "learning_rate": 1.043128119184167e-08, "epoch": 1.9881971573435293, "percentage": 99.41, "elapsed_time": "2 days, 16:31:52", "remaining_time": "0:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29950, "total_steps": 30076, "loss": 0.4068, "learning_rate": 5.346391637583992e-09, "epoch": 1.9915219017538028, "percentage": 99.58, "elapsed_time": "2 days, 16:38:18", "remaining_time": "0:16:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30000, "total_steps": 30076, "loss": 0.4035, "learning_rate": 1.945144130788279e-09, "epoch": 1.9948466461640761, "percentage": 99.75, "elapsed_time": "2 days, 16:44:41", "remaining_time": "0:09:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30000, "total_steps": 30076, "eval_loss": 0.3463568687438965, "epoch": 1.9948466461640761, "percentage": 99.75, "elapsed_time": "2 days, 17:57:35", "remaining_time": "0:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30050, "total_steps": 30076, "loss": 0.3829, "learning_rate": 2.2765321335826983e-10, "epoch": 1.9981713905743494, "percentage": 99.91, "elapsed_time": "2 days, 18:03:43", "remaining_time": "0:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30076, "total_steps": 30076, "epoch": 1.9999002576676919, "percentage": 100.0, "elapsed_time": "2 days, 18:07:13", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}