full_reviewer_7b / trainer_log.jsonl
sumuks's picture
Training in progress, step 3537
57dcbb4 verified
{"current_steps": 10, "total_steps": 3537, "loss": 2.0351, "lr": 1.4124293785310734e-06, "epoch": 0.008481764206955046, "percentage": 0.28, "elapsed_time": "0:00:20", "remaining_time": "2:03:10"}
{"current_steps": 20, "total_steps": 3537, "loss": 1.9766, "lr": 2.824858757062147e-06, "epoch": 0.016963528413910092, "percentage": 0.57, "elapsed_time": "0:00:41", "remaining_time": "2:01:12"}
{"current_steps": 30, "total_steps": 3537, "loss": 1.951, "lr": 4.23728813559322e-06, "epoch": 0.02544529262086514, "percentage": 0.85, "elapsed_time": "0:01:01", "remaining_time": "2:00:17"}
{"current_steps": 40, "total_steps": 3537, "loss": 1.8941, "lr": 5.649717514124294e-06, "epoch": 0.033927056827820185, "percentage": 1.13, "elapsed_time": "0:01:22", "remaining_time": "1:59:41"}
{"current_steps": 50, "total_steps": 3537, "loss": 1.8506, "lr": 7.062146892655368e-06, "epoch": 0.04240882103477523, "percentage": 1.41, "elapsed_time": "0:01:42", "remaining_time": "1:59:11"}
{"current_steps": 60, "total_steps": 3537, "loss": 1.8052, "lr": 8.47457627118644e-06, "epoch": 0.05089058524173028, "percentage": 1.7, "elapsed_time": "0:02:02", "remaining_time": "1:58:45"}
{"current_steps": 70, "total_steps": 3537, "loss": 1.8038, "lr": 9.887005649717516e-06, "epoch": 0.05937234944868533, "percentage": 1.98, "elapsed_time": "0:02:23", "remaining_time": "1:58:20"}
{"current_steps": 80, "total_steps": 3537, "loss": 1.7649, "lr": 1.1299435028248587e-05, "epoch": 0.06785411365564037, "percentage": 2.26, "elapsed_time": "0:02:43", "remaining_time": "1:57:57"}
{"current_steps": 90, "total_steps": 3537, "loss": 1.7458, "lr": 1.2711864406779661e-05, "epoch": 0.07633587786259542, "percentage": 2.54, "elapsed_time": "0:03:04", "remaining_time": "1:57:34"}
{"current_steps": 100, "total_steps": 3537, "loss": 1.75, "lr": 1.4124293785310736e-05, "epoch": 0.08481764206955046, "percentage": 2.83, "elapsed_time": "0:03:24", "remaining_time": "1:57:11"}
{"current_steps": 110, "total_steps": 3537, "loss": 1.7462, "lr": 1.553672316384181e-05, "epoch": 0.09329940627650551, "percentage": 3.11, "elapsed_time": "0:03:44", "remaining_time": "1:56:48"}
{"current_steps": 120, "total_steps": 3537, "loss": 1.7414, "lr": 1.694915254237288e-05, "epoch": 0.10178117048346055, "percentage": 3.39, "elapsed_time": "0:04:05", "remaining_time": "1:56:25"}
{"current_steps": 130, "total_steps": 3537, "loss": 1.7446, "lr": 1.8361581920903956e-05, "epoch": 0.1102629346904156, "percentage": 3.68, "elapsed_time": "0:04:25", "remaining_time": "1:56:02"}
{"current_steps": 140, "total_steps": 3537, "loss": 1.7285, "lr": 1.977401129943503e-05, "epoch": 0.11874469889737066, "percentage": 3.96, "elapsed_time": "0:04:45", "remaining_time": "1:55:39"}
{"current_steps": 150, "total_steps": 3537, "loss": 1.7406, "lr": 2.1186440677966103e-05, "epoch": 0.1272264631043257, "percentage": 4.24, "elapsed_time": "0:05:06", "remaining_time": "1:55:16"}
{"current_steps": 160, "total_steps": 3537, "loss": 1.7338, "lr": 2.2598870056497175e-05, "epoch": 0.13570822731128074, "percentage": 4.52, "elapsed_time": "0:05:26", "remaining_time": "1:54:53"}
{"current_steps": 170, "total_steps": 3537, "loss": 1.7048, "lr": 2.401129943502825e-05, "epoch": 0.1441899915182358, "percentage": 4.81, "elapsed_time": "0:05:46", "remaining_time": "1:54:31"}
{"current_steps": 180, "total_steps": 3537, "loss": 1.729, "lr": 2.5423728813559322e-05, "epoch": 0.15267175572519084, "percentage": 5.09, "elapsed_time": "0:06:07", "remaining_time": "1:54:08"}
{"current_steps": 190, "total_steps": 3537, "loss": 1.7157, "lr": 2.68361581920904e-05, "epoch": 0.16115351993214588, "percentage": 5.37, "elapsed_time": "0:06:27", "remaining_time": "1:53:46"}
{"current_steps": 200, "total_steps": 3537, "loss": 1.7065, "lr": 2.8248587570621472e-05, "epoch": 0.16963528413910092, "percentage": 5.65, "elapsed_time": "0:06:47", "remaining_time": "1:53:25"}
{"current_steps": 210, "total_steps": 3537, "loss": 1.7147, "lr": 2.9661016949152544e-05, "epoch": 0.178117048346056, "percentage": 5.94, "elapsed_time": "0:07:08", "remaining_time": "1:53:03"}
{"current_steps": 220, "total_steps": 3537, "loss": 1.7245, "lr": 3.107344632768362e-05, "epoch": 0.18659881255301103, "percentage": 6.22, "elapsed_time": "0:07:28", "remaining_time": "1:52:41"}
{"current_steps": 230, "total_steps": 3537, "loss": 1.7045, "lr": 3.2485875706214694e-05, "epoch": 0.19508057675996607, "percentage": 6.5, "elapsed_time": "0:07:48", "remaining_time": "1:52:19"}
{"current_steps": 240, "total_steps": 3537, "loss": 1.6859, "lr": 3.389830508474576e-05, "epoch": 0.2035623409669211, "percentage": 6.79, "elapsed_time": "0:08:09", "remaining_time": "1:51:58"}
{"current_steps": 250, "total_steps": 3537, "loss": 1.7053, "lr": 3.531073446327684e-05, "epoch": 0.21204410517387617, "percentage": 7.07, "elapsed_time": "0:08:29", "remaining_time": "1:51:37"}
{"current_steps": 260, "total_steps": 3537, "loss": 1.6977, "lr": 3.672316384180791e-05, "epoch": 0.2205258693808312, "percentage": 7.35, "elapsed_time": "0:08:49", "remaining_time": "1:51:15"}
{"current_steps": 270, "total_steps": 3537, "loss": 1.7306, "lr": 3.813559322033898e-05, "epoch": 0.22900763358778625, "percentage": 7.63, "elapsed_time": "0:09:09", "remaining_time": "1:50:54"}
{"current_steps": 280, "total_steps": 3537, "loss": 1.688, "lr": 3.954802259887006e-05, "epoch": 0.23748939779474132, "percentage": 7.92, "elapsed_time": "0:09:30", "remaining_time": "1:50:33"}
{"current_steps": 290, "total_steps": 3537, "loss": 1.6959, "lr": 4.096045197740113e-05, "epoch": 0.24597116200169636, "percentage": 8.2, "elapsed_time": "0:09:50", "remaining_time": "1:50:12"}
{"current_steps": 300, "total_steps": 3537, "loss": 1.7084, "lr": 4.2372881355932206e-05, "epoch": 0.2544529262086514, "percentage": 8.48, "elapsed_time": "0:10:10", "remaining_time": "1:49:51"}
{"current_steps": 310, "total_steps": 3537, "loss": 1.6758, "lr": 4.378531073446328e-05, "epoch": 0.26293469041560646, "percentage": 8.76, "elapsed_time": "0:10:31", "remaining_time": "1:49:30"}
{"current_steps": 320, "total_steps": 3537, "loss": 1.7053, "lr": 4.519774011299435e-05, "epoch": 0.2714164546225615, "percentage": 9.05, "elapsed_time": "0:10:51", "remaining_time": "1:49:09"}
{"current_steps": 330, "total_steps": 3537, "loss": 1.7106, "lr": 4.6610169491525425e-05, "epoch": 0.27989821882951654, "percentage": 9.33, "elapsed_time": "0:11:11", "remaining_time": "1:48:48"}
{"current_steps": 340, "total_steps": 3537, "loss": 1.6952, "lr": 4.80225988700565e-05, "epoch": 0.2883799830364716, "percentage": 9.61, "elapsed_time": "0:11:32", "remaining_time": "1:48:27"}
{"current_steps": 350, "total_steps": 3537, "loss": 1.7141, "lr": 4.9435028248587575e-05, "epoch": 0.2968617472434266, "percentage": 9.9, "elapsed_time": "0:11:52", "remaining_time": "1:48:07"}
{"current_steps": 360, "total_steps": 3537, "loss": 1.6916, "lr": 4.999956163314189e-05, "epoch": 0.3053435114503817, "percentage": 10.18, "elapsed_time": "0:12:12", "remaining_time": "1:47:46"}
{"current_steps": 370, "total_steps": 3537, "loss": 1.6689, "lr": 4.9996882780236966e-05, "epoch": 0.3138252756573367, "percentage": 10.46, "elapsed_time": "0:12:33", "remaining_time": "1:47:25"}
{"current_steps": 380, "total_steps": 3537, "loss": 1.6957, "lr": 4.99917688722129e-05, "epoch": 0.32230703986429177, "percentage": 10.74, "elapsed_time": "0:12:53", "remaining_time": "1:47:04"}
{"current_steps": 390, "total_steps": 3537, "loss": 1.6925, "lr": 4.9984220407237743e-05, "epoch": 0.33078880407124683, "percentage": 11.03, "elapsed_time": "0:13:13", "remaining_time": "1:46:43"}
{"current_steps": 400, "total_steps": 3537, "loss": 1.7053, "lr": 4.997423812064029e-05, "epoch": 0.33927056827820185, "percentage": 11.31, "elapsed_time": "0:13:33", "remaining_time": "1:46:23"}
{"current_steps": 410, "total_steps": 3537, "loss": 1.6835, "lr": 4.996182298483854e-05, "epoch": 0.3477523324851569, "percentage": 11.59, "elapsed_time": "0:13:54", "remaining_time": "1:46:02"}
{"current_steps": 420, "total_steps": 3537, "loss": 1.6833, "lr": 4.9946976209244876e-05, "epoch": 0.356234096692112, "percentage": 11.87, "elapsed_time": "0:14:14", "remaining_time": "1:45:41"}
{"current_steps": 430, "total_steps": 3537, "loss": 1.6965, "lr": 4.992969924014831e-05, "epoch": 0.364715860899067, "percentage": 12.16, "elapsed_time": "0:14:34", "remaining_time": "1:45:21"}
{"current_steps": 440, "total_steps": 3537, "loss": 1.6797, "lr": 4.990999376057358e-05, "epoch": 0.37319762510602206, "percentage": 12.44, "elapsed_time": "0:14:55", "remaining_time": "1:45:00"}
{"current_steps": 450, "total_steps": 3537, "loss": 1.7047, "lr": 4.98878616901172e-05, "epoch": 0.3816793893129771, "percentage": 12.72, "elapsed_time": "0:15:15", "remaining_time": "1:44:40"}
{"current_steps": 460, "total_steps": 3537, "loss": 1.6825, "lr": 4.986330518476046e-05, "epoch": 0.39016115351993214, "percentage": 13.01, "elapsed_time": "0:15:35", "remaining_time": "1:44:19"}
{"current_steps": 470, "total_steps": 3537, "loss": 1.6983, "lr": 4.983632663665937e-05, "epoch": 0.3986429177268872, "percentage": 13.29, "elapsed_time": "0:15:56", "remaining_time": "1:43:59"}
{"current_steps": 480, "total_steps": 3537, "loss": 1.6838, "lr": 4.980692867391172e-05, "epoch": 0.4071246819338422, "percentage": 13.57, "elapsed_time": "0:16:16", "remaining_time": "1:43:38"}
{"current_steps": 490, "total_steps": 3537, "loss": 1.6812, "lr": 4.9775114160300974e-05, "epoch": 0.4156064461407973, "percentage": 13.85, "elapsed_time": "0:16:36", "remaining_time": "1:43:17"}
{"current_steps": 500, "total_steps": 3537, "loss": 1.6934, "lr": 4.974088619501733e-05, "epoch": 0.42408821034775235, "percentage": 14.14, "elapsed_time": "0:16:57", "remaining_time": "1:42:57"}
{"current_steps": 510, "total_steps": 3537, "loss": 1.7084, "lr": 4.970424811235582e-05, "epoch": 0.43256997455470736, "percentage": 14.42, "elapsed_time": "0:17:40", "remaining_time": "1:44:54"}
{"current_steps": 520, "total_steps": 3537, "loss": 1.6919, "lr": 4.966520348139149e-05, "epoch": 0.4410517387616624, "percentage": 14.7, "elapsed_time": "0:18:00", "remaining_time": "1:44:30"}
{"current_steps": 530, "total_steps": 3537, "loss": 1.6909, "lr": 4.9623756105631755e-05, "epoch": 0.4495335029686175, "percentage": 14.98, "elapsed_time": "0:18:21", "remaining_time": "1:44:07"}
{"current_steps": 540, "total_steps": 3537, "loss": 1.6863, "lr": 4.9579910022645816e-05, "epoch": 0.4580152671755725, "percentage": 15.27, "elapsed_time": "0:18:41", "remaining_time": "1:43:44"}
{"current_steps": 550, "total_steps": 3537, "loss": 1.6877, "lr": 4.9533669503671417e-05, "epoch": 0.46649703138252757, "percentage": 15.55, "elapsed_time": "0:19:01", "remaining_time": "1:43:21"}
{"current_steps": 560, "total_steps": 3537, "loss": 1.6949, "lr": 4.94850390531987e-05, "epoch": 0.47497879558948264, "percentage": 15.83, "elapsed_time": "0:19:22", "remaining_time": "1:42:58"}
{"current_steps": 570, "total_steps": 3537, "loss": 1.6817, "lr": 4.943402340853146e-05, "epoch": 0.48346055979643765, "percentage": 16.12, "elapsed_time": "0:19:42", "remaining_time": "1:42:35"}
{"current_steps": 580, "total_steps": 3537, "loss": 1.6908, "lr": 4.938062753932562e-05, "epoch": 0.4919423240033927, "percentage": 16.4, "elapsed_time": "0:20:02", "remaining_time": "1:42:12"}
{"current_steps": 590, "total_steps": 3537, "loss": 1.685, "lr": 4.9324856647105144e-05, "epoch": 0.5004240882103478, "percentage": 16.68, "elapsed_time": "0:20:23", "remaining_time": "1:41:50"}
{"current_steps": 600, "total_steps": 3537, "loss": 1.6658, "lr": 4.9266716164755305e-05, "epoch": 0.5089058524173028, "percentage": 16.96, "elapsed_time": "0:20:43", "remaining_time": "1:41:27"}
{"current_steps": 600, "total_steps": 3537, "eval_loss": 1.6607000827789307, "epoch": 0.5089058524173028, "percentage": 16.96, "elapsed_time": "0:20:52", "remaining_time": "1:42:08"}
{"current_steps": 610, "total_steps": 3537, "loss": 1.6953, "lr": 4.920621175599348e-05, "epoch": 0.5173876166242578, "percentage": 17.25, "elapsed_time": "0:21:12", "remaining_time": "1:41:45"}
{"current_steps": 620, "total_steps": 3537, "loss": 1.6882, "lr": 4.9143349314817394e-05, "epoch": 0.5258693808312129, "percentage": 17.53, "elapsed_time": "0:21:32", "remaining_time": "1:41:21"}
{"current_steps": 630, "total_steps": 3537, "loss": 1.696, "lr": 4.9078134964930975e-05, "epoch": 0.5343511450381679, "percentage": 17.81, "elapsed_time": "0:21:52", "remaining_time": "1:40:58"}
{"current_steps": 640, "total_steps": 3537, "loss": 1.6657, "lr": 4.90105750591478e-05, "epoch": 0.542832909245123, "percentage": 18.09, "elapsed_time": "0:22:13", "remaining_time": "1:40:35"}
{"current_steps": 650, "total_steps": 3537, "loss": 1.6583, "lr": 4.894067617877227e-05, "epoch": 0.5513146734520781, "percentage": 18.38, "elapsed_time": "0:22:33", "remaining_time": "1:40:11"}
{"current_steps": 660, "total_steps": 3537, "loss": 1.6808, "lr": 4.886844513295846e-05, "epoch": 0.5597964376590331, "percentage": 18.66, "elapsed_time": "0:22:53", "remaining_time": "1:39:48"}
{"current_steps": 670, "total_steps": 3537, "loss": 1.6988, "lr": 4.8793888958046855e-05, "epoch": 0.5682782018659881, "percentage": 18.94, "elapsed_time": "0:23:14", "remaining_time": "1:39:25"}
{"current_steps": 680, "total_steps": 3537, "loss": 1.6782, "lr": 4.871701491687884e-05, "epoch": 0.5767599660729432, "percentage": 19.23, "elapsed_time": "0:23:34", "remaining_time": "1:39:02"}
{"current_steps": 690, "total_steps": 3537, "loss": 1.6755, "lr": 4.863783049808929e-05, "epoch": 0.5852417302798982, "percentage": 19.51, "elapsed_time": "0:23:54", "remaining_time": "1:38:39"}
{"current_steps": 700, "total_steps": 3537, "loss": 1.6832, "lr": 4.855634341537697e-05, "epoch": 0.5937234944868532, "percentage": 19.79, "elapsed_time": "0:24:15", "remaining_time": "1:38:17"}
{"current_steps": 710, "total_steps": 3537, "loss": 1.6524, "lr": 4.847256160675319e-05, "epoch": 0.6022052586938084, "percentage": 20.07, "elapsed_time": "0:24:35", "remaining_time": "1:37:54"}
{"current_steps": 720, "total_steps": 3537, "loss": 1.6641, "lr": 4.8386493233768465e-05, "epoch": 0.6106870229007634, "percentage": 20.36, "elapsed_time": "0:24:55", "remaining_time": "1:37:31"}
{"current_steps": 730, "total_steps": 3537, "loss": 1.6616, "lr": 4.829814668071752e-05, "epoch": 0.6191687871077184, "percentage": 20.64, "elapsed_time": "0:25:15", "remaining_time": "1:37:09"}
{"current_steps": 740, "total_steps": 3537, "loss": 1.7041, "lr": 4.820753055382253e-05, "epoch": 0.6276505513146734, "percentage": 20.92, "elapsed_time": "0:25:36", "remaining_time": "1:36:46"}
{"current_steps": 750, "total_steps": 3537, "loss": 1.6773, "lr": 4.811465368039467e-05, "epoch": 0.6361323155216285, "percentage": 21.2, "elapsed_time": "0:25:56", "remaining_time": "1:36:24"}
{"current_steps": 760, "total_steps": 3537, "loss": 1.6619, "lr": 4.801952510797433e-05, "epoch": 0.6446140797285835, "percentage": 21.49, "elapsed_time": "0:26:16", "remaining_time": "1:36:01"}
{"current_steps": 770, "total_steps": 3537, "loss": 1.6967, "lr": 4.792215410344968e-05, "epoch": 0.6530958439355385, "percentage": 21.77, "elapsed_time": "0:26:37", "remaining_time": "1:35:39"}
{"current_steps": 780, "total_steps": 3537, "loss": 1.657, "lr": 4.7822550152153946e-05, "epoch": 0.6615776081424937, "percentage": 22.05, "elapsed_time": "0:26:57", "remaining_time": "1:35:17"}
{"current_steps": 790, "total_steps": 3537, "loss": 1.6645, "lr": 4.7720722956941434e-05, "epoch": 0.6700593723494487, "percentage": 22.34, "elapsed_time": "0:27:17", "remaining_time": "1:34:55"}
{"current_steps": 800, "total_steps": 3537, "loss": 1.6618, "lr": 4.7616682437242295e-05, "epoch": 0.6785411365564037, "percentage": 22.62, "elapsed_time": "0:27:38", "remaining_time": "1:34:32"}
{"current_steps": 810, "total_steps": 3537, "loss": 1.6689, "lr": 4.751043872809626e-05, "epoch": 0.6870229007633588, "percentage": 22.9, "elapsed_time": "0:27:58", "remaining_time": "1:34:10"}
{"current_steps": 820, "total_steps": 3537, "loss": 1.6751, "lr": 4.740200217916534e-05, "epoch": 0.6955046649703138, "percentage": 23.18, "elapsed_time": "0:28:18", "remaining_time": "1:33:48"}
{"current_steps": 830, "total_steps": 3537, "loss": 1.6549, "lr": 4.729138335372558e-05, "epoch": 0.7039864291772688, "percentage": 23.47, "elapsed_time": "0:28:39", "remaining_time": "1:33:26"}
{"current_steps": 840, "total_steps": 3537, "loss": 1.6528, "lr": 4.717859302763812e-05, "epoch": 0.712468193384224, "percentage": 23.75, "elapsed_time": "0:28:59", "remaining_time": "1:33:04"}
{"current_steps": 850, "total_steps": 3537, "loss": 1.6689, "lr": 4.7063642188299384e-05, "epoch": 0.720949957591179, "percentage": 24.03, "elapsed_time": "0:29:19", "remaining_time": "1:32:42"}
{"current_steps": 860, "total_steps": 3537, "loss": 1.696, "lr": 4.694654203357082e-05, "epoch": 0.729431721798134, "percentage": 24.31, "elapsed_time": "0:29:40", "remaining_time": "1:32:21"}
{"current_steps": 870, "total_steps": 3537, "loss": 1.6834, "lr": 4.682730397068803e-05, "epoch": 0.7379134860050891, "percentage": 24.6, "elapsed_time": "0:30:00", "remaining_time": "1:31:59"}
{"current_steps": 880, "total_steps": 3537, "loss": 1.653, "lr": 4.670593961514955e-05, "epoch": 0.7463952502120441, "percentage": 24.88, "elapsed_time": "0:30:20", "remaining_time": "1:31:37"}
{"current_steps": 890, "total_steps": 3537, "loss": 1.6716, "lr": 4.658246078958534e-05, "epoch": 0.7548770144189991, "percentage": 25.16, "elapsed_time": "0:30:41", "remaining_time": "1:31:15"}
{"current_steps": 900, "total_steps": 3537, "loss": 1.6456, "lr": 4.645687952260508e-05, "epoch": 0.7633587786259542, "percentage": 25.45, "elapsed_time": "0:31:01", "remaining_time": "1:30:53"}
{"current_steps": 910, "total_steps": 3537, "loss": 1.6783, "lr": 4.6329208047626425e-05, "epoch": 0.7718405428329093, "percentage": 25.73, "elapsed_time": "0:31:21", "remaining_time": "1:30:32"}
{"current_steps": 920, "total_steps": 3537, "loss": 1.6748, "lr": 4.619945880168329e-05, "epoch": 0.7803223070398643, "percentage": 26.01, "elapsed_time": "0:31:41", "remaining_time": "1:30:10"}
{"current_steps": 930, "total_steps": 3537, "loss": 1.6767, "lr": 4.6067644424214286e-05, "epoch": 0.7888040712468194, "percentage": 26.29, "elapsed_time": "0:32:02", "remaining_time": "1:29:48"}
{"current_steps": 940, "total_steps": 3537, "loss": 1.6971, "lr": 4.5933777755831474e-05, "epoch": 0.7972858354537744, "percentage": 26.58, "elapsed_time": "0:32:22", "remaining_time": "1:29:27"}
{"current_steps": 950, "total_steps": 3537, "loss": 1.6897, "lr": 4.579787183706952e-05, "epoch": 0.8057675996607294, "percentage": 26.86, "elapsed_time": "0:32:42", "remaining_time": "1:29:05"}
{"current_steps": 960, "total_steps": 3537, "loss": 1.6722, "lr": 4.565993990711531e-05, "epoch": 0.8142493638676844, "percentage": 27.14, "elapsed_time": "0:33:03", "remaining_time": "1:28:43"}
{"current_steps": 970, "total_steps": 3537, "loss": 1.6464, "lr": 4.551999540251834e-05, "epoch": 0.8227311280746396, "percentage": 27.42, "elapsed_time": "0:33:23", "remaining_time": "1:28:22"}
{"current_steps": 980, "total_steps": 3537, "loss": 1.6734, "lr": 4.537805195588172e-05, "epoch": 0.8312128922815946, "percentage": 27.71, "elapsed_time": "0:33:43", "remaining_time": "1:28:00"}
{"current_steps": 990, "total_steps": 3537, "loss": 1.6824, "lr": 4.523412339453422e-05, "epoch": 0.8396946564885496, "percentage": 27.99, "elapsed_time": "0:34:04", "remaining_time": "1:27:39"}
{"current_steps": 1000, "total_steps": 3537, "loss": 1.6659, "lr": 4.508822373918328e-05, "epoch": 0.8481764206955047, "percentage": 28.27, "elapsed_time": "0:34:24", "remaining_time": "1:27:17"}
{"current_steps": 1010, "total_steps": 3537, "loss": 1.6707, "lr": 4.494036720254915e-05, "epoch": 0.8566581849024597, "percentage": 28.56, "elapsed_time": "0:35:07", "remaining_time": "1:27:53"}
{"current_steps": 1020, "total_steps": 3537, "loss": 1.6561, "lr": 4.479056818798044e-05, "epoch": 0.8651399491094147, "percentage": 28.84, "elapsed_time": "0:35:28", "remaining_time": "1:27:31"}
{"current_steps": 1030, "total_steps": 3537, "loss": 1.6344, "lr": 4.463884128805097e-05, "epoch": 0.8736217133163698, "percentage": 29.12, "elapsed_time": "0:35:48", "remaining_time": "1:27:08"}
{"current_steps": 1040, "total_steps": 3537, "loss": 1.6583, "lr": 4.448520128313826e-05, "epoch": 0.8821034775233249, "percentage": 29.4, "elapsed_time": "0:36:08", "remaining_time": "1:26:46"}
{"current_steps": 1050, "total_steps": 3537, "loss": 1.6674, "lr": 4.432966313998371e-05, "epoch": 0.8905852417302799, "percentage": 29.69, "elapsed_time": "0:36:28", "remaining_time": "1:26:24"}
{"current_steps": 1060, "total_steps": 3537, "loss": 1.6522, "lr": 4.4172242010234643e-05, "epoch": 0.899067005937235, "percentage": 29.97, "elapsed_time": "0:36:49", "remaining_time": "1:26:02"}
{"current_steps": 1070, "total_steps": 3537, "loss": 1.6563, "lr": 4.401295322896827e-05, "epoch": 0.90754877014419, "percentage": 30.25, "elapsed_time": "0:37:09", "remaining_time": "1:25:40"}
{"current_steps": 1080, "total_steps": 3537, "loss": 1.6677, "lr": 4.385181231319788e-05, "epoch": 0.916030534351145, "percentage": 30.53, "elapsed_time": "0:37:30", "remaining_time": "1:25:18"}
{"current_steps": 1090, "total_steps": 3537, "loss": 1.6784, "lr": 4.368883496036125e-05, "epoch": 0.9245122985581001, "percentage": 30.82, "elapsed_time": "0:37:50", "remaining_time": "1:24:56"}
{"current_steps": 1100, "total_steps": 3537, "loss": 1.6565, "lr": 4.3524037046791455e-05, "epoch": 0.9329940627650551, "percentage": 31.1, "elapsed_time": "0:38:10", "remaining_time": "1:24:34"}
{"current_steps": 1110, "total_steps": 3537, "loss": 1.6514, "lr": 4.335743462617036e-05, "epoch": 0.9414758269720102, "percentage": 31.38, "elapsed_time": "0:38:31", "remaining_time": "1:24:13"}
{"current_steps": 1120, "total_steps": 3537, "loss": 1.6546, "lr": 4.318904392796467e-05, "epoch": 0.9499575911789653, "percentage": 31.67, "elapsed_time": "0:38:51", "remaining_time": "1:23:51"}
{"current_steps": 1130, "total_steps": 3537, "loss": 1.6445, "lr": 4.3018881355844996e-05, "epoch": 0.9584393553859203, "percentage": 31.95, "elapsed_time": "0:39:11", "remaining_time": "1:23:29"}
{"current_steps": 1140, "total_steps": 3537, "loss": 1.665, "lr": 4.2846963486087926e-05, "epoch": 0.9669211195928753, "percentage": 32.23, "elapsed_time": "0:39:31", "remaining_time": "1:23:07"}
{"current_steps": 1150, "total_steps": 3537, "loss": 1.6917, "lr": 4.2673307065961196e-05, "epoch": 0.9754028837998303, "percentage": 32.51, "elapsed_time": "0:39:52", "remaining_time": "1:22:45"}
{"current_steps": 1160, "total_steps": 3537, "loss": 1.6593, "lr": 4.249792901209233e-05, "epoch": 0.9838846480067854, "percentage": 32.8, "elapsed_time": "0:40:12", "remaining_time": "1:22:23"}
{"current_steps": 1170, "total_steps": 3537, "loss": 1.6515, "lr": 4.2320846408820644e-05, "epoch": 0.9923664122137404, "percentage": 33.08, "elapsed_time": "0:40:32", "remaining_time": "1:22:01"}
{"current_steps": 1180, "total_steps": 3537, "loss": 1.6132, "lr": 4.214207650653306e-05, "epoch": 1.0008481764206956, "percentage": 33.36, "elapsed_time": "0:40:53", "remaining_time": "1:21:40"}
{"current_steps": 1190, "total_steps": 3537, "loss": 1.6052, "lr": 4.196163671998364e-05, "epoch": 1.0093299406276506, "percentage": 33.64, "elapsed_time": "0:41:13", "remaining_time": "1:21:18"}
{"current_steps": 1200, "total_steps": 3537, "loss": 1.5992, "lr": 4.1779544626597125e-05, "epoch": 1.0178117048346056, "percentage": 33.93, "elapsed_time": "0:41:33", "remaining_time": "1:20:56"}
{"current_steps": 1200, "total_steps": 3537, "eval_loss": 1.6405301094055176, "epoch": 1.0178117048346056, "percentage": 33.93, "elapsed_time": "0:41:42", "remaining_time": "1:21:13"}
{"current_steps": 1210, "total_steps": 3537, "loss": 1.6427, "lr": 4.159581796475665e-05, "epoch": 1.0262934690415606, "percentage": 34.21, "elapsed_time": "0:42:02", "remaining_time": "1:20:51"}
{"current_steps": 1220, "total_steps": 3537, "loss": 1.6227, "lr": 4.1410474632075794e-05, "epoch": 1.0347752332485156, "percentage": 34.49, "elapsed_time": "0:42:22", "remaining_time": "1:20:29"}
{"current_steps": 1230, "total_steps": 3537, "loss": 1.6279, "lr": 4.122353268365507e-05, "epoch": 1.0432569974554706, "percentage": 34.78, "elapsed_time": "0:42:43", "remaining_time": "1:20:07"}
{"current_steps": 1240, "total_steps": 3537, "loss": 1.6102, "lr": 4.1035010330323086e-05, "epoch": 1.0517387616624259, "percentage": 35.06, "elapsed_time": "0:43:03", "remaining_time": "1:19:45"}
{"current_steps": 1250, "total_steps": 3537, "loss": 1.6443, "lr": 4.084492593686261e-05, "epoch": 1.0602205258693809, "percentage": 35.34, "elapsed_time": "0:43:23", "remaining_time": "1:19:23"}
{"current_steps": 1260, "total_steps": 3537, "loss": 1.6221, "lr": 4.0653298020221496e-05, "epoch": 1.0687022900763359, "percentage": 35.62, "elapsed_time": "0:43:44", "remaining_time": "1:19:02"}
{"current_steps": 1270, "total_steps": 3537, "loss": 1.635, "lr": 4.046014524770893e-05, "epoch": 1.077184054283291, "percentage": 35.91, "elapsed_time": "0:44:04", "remaining_time": "1:18:40"}
{"current_steps": 1280, "total_steps": 3537, "loss": 1.6255, "lr": 4.026548643517694e-05, "epoch": 1.085665818490246, "percentage": 36.19, "elapsed_time": "0:44:24", "remaining_time": "1:18:18"}
{"current_steps": 1290, "total_steps": 3537, "loss": 1.5958, "lr": 4.006934054518745e-05, "epoch": 1.094147582697201, "percentage": 36.47, "elapsed_time": "0:44:44", "remaining_time": "1:17:56"}
{"current_steps": 1300, "total_steps": 3537, "loss": 1.6374, "lr": 3.98717266851651e-05, "epoch": 1.1026293469041561, "percentage": 36.75, "elapsed_time": "0:45:05", "remaining_time": "1:17:35"}
{"current_steps": 1310, "total_steps": 3537, "loss": 1.6139, "lr": 3.967266410553584e-05, "epoch": 1.1111111111111112, "percentage": 37.04, "elapsed_time": "0:45:25", "remaining_time": "1:17:13"}
{"current_steps": 1320, "total_steps": 3537, "loss": 1.6291, "lr": 3.947217219785174e-05, "epoch": 1.1195928753180662, "percentage": 37.32, "elapsed_time": "0:45:45", "remaining_time": "1:16:51"}
{"current_steps": 1330, "total_steps": 3537, "loss": 1.6286, "lr": 3.92702704929019e-05, "epoch": 1.1280746395250212, "percentage": 37.6, "elapsed_time": "0:46:06", "remaining_time": "1:16:30"}
{"current_steps": 1340, "total_steps": 3537, "loss": 1.6168, "lr": 3.906697865880995e-05, "epoch": 1.1365564037319762, "percentage": 37.89, "elapsed_time": "0:46:26", "remaining_time": "1:16:08"}
{"current_steps": 1350, "total_steps": 3537, "loss": 1.6463, "lr": 3.886231649911799e-05, "epoch": 1.1450381679389312, "percentage": 38.17, "elapsed_time": "0:46:46", "remaining_time": "1:15:46"}
{"current_steps": 1360, "total_steps": 3537, "loss": 1.6448, "lr": 3.865630395085754e-05, "epoch": 1.1535199321458864, "percentage": 38.45, "elapsed_time": "0:47:07", "remaining_time": "1:15:25"}
{"current_steps": 1370, "total_steps": 3537, "loss": 1.6236, "lr": 3.8448961082607346e-05, "epoch": 1.1620016963528415, "percentage": 38.73, "elapsed_time": "0:47:27", "remaining_time": "1:15:03"}
{"current_steps": 1380, "total_steps": 3537, "loss": 1.6289, "lr": 3.82403080925384e-05, "epoch": 1.1704834605597965, "percentage": 39.02, "elapsed_time": "0:47:47", "remaining_time": "1:14:42"}
{"current_steps": 1390, "total_steps": 3537, "loss": 1.6059, "lr": 3.803036530644636e-05, "epoch": 1.1789652247667515, "percentage": 39.3, "elapsed_time": "0:48:07", "remaining_time": "1:14:20"}
{"current_steps": 1400, "total_steps": 3537, "loss": 1.6339, "lr": 3.7819153175771524e-05, "epoch": 1.1874469889737065, "percentage": 39.58, "elapsed_time": "0:48:28", "remaining_time": "1:13:59"}
{"current_steps": 1410, "total_steps": 3537, "loss": 1.6112, "lr": 3.7606692275606596e-05, "epoch": 1.1959287531806615, "percentage": 39.86, "elapsed_time": "0:48:48", "remaining_time": "1:13:37"}
{"current_steps": 1420, "total_steps": 3537, "loss": 1.6095, "lr": 3.739300330269232e-05, "epoch": 1.2044105173876165, "percentage": 40.15, "elapsed_time": "0:49:08", "remaining_time": "1:13:16"}
{"current_steps": 1430, "total_steps": 3537, "loss": 1.602, "lr": 3.7178107073401356e-05, "epoch": 1.2128922815945717, "percentage": 40.43, "elapsed_time": "0:49:29", "remaining_time": "1:12:54"}
{"current_steps": 1440, "total_steps": 3537, "loss": 1.6087, "lr": 3.696202452171047e-05, "epoch": 1.2213740458015268, "percentage": 40.71, "elapsed_time": "0:49:49", "remaining_time": "1:12:33"}
{"current_steps": 1450, "total_steps": 3537, "loss": 1.6143, "lr": 3.674477669716125e-05, "epoch": 1.2298558100084818, "percentage": 41.0, "elapsed_time": "0:50:09", "remaining_time": "1:12:11"}
{"current_steps": 1460, "total_steps": 3537, "loss": 1.6236, "lr": 3.6526384762809574e-05, "epoch": 1.2383375742154368, "percentage": 41.28, "elapsed_time": "0:50:30", "remaining_time": "1:11:50"}
{"current_steps": 1470, "total_steps": 3537, "loss": 1.6271, "lr": 3.630686999316406e-05, "epoch": 1.2468193384223918, "percentage": 41.56, "elapsed_time": "0:50:50", "remaining_time": "1:11:29"}
{"current_steps": 1480, "total_steps": 3537, "loss": 1.6396, "lr": 3.608625377211357e-05, "epoch": 1.255301102629347, "percentage": 41.84, "elapsed_time": "0:51:10", "remaining_time": "1:11:07"}
{"current_steps": 1490, "total_steps": 3537, "loss": 1.5935, "lr": 3.5864557590844164e-05, "epoch": 1.263782866836302, "percentage": 42.13, "elapsed_time": "0:51:30", "remaining_time": "1:10:46"}
{"current_steps": 1500, "total_steps": 3537, "loss": 1.6093, "lr": 3.564180304574549e-05, "epoch": 1.272264631043257, "percentage": 42.41, "elapsed_time": "0:51:51", "remaining_time": "1:10:24"}
{"current_steps": 1510, "total_steps": 3537, "loss": 1.6601, "lr": 3.541801183630706e-05, "epoch": 1.280746395250212, "percentage": 42.69, "elapsed_time": "0:52:32", "remaining_time": "1:10:32"}
{"current_steps": 1520, "total_steps": 3537, "loss": 1.6269, "lr": 3.519320576300436e-05, "epoch": 1.289228159457167, "percentage": 42.97, "elapsed_time": "0:52:53", "remaining_time": "1:10:10"}
{"current_steps": 1530, "total_steps": 3537, "loss": 1.6089, "lr": 3.4967406725175165e-05, "epoch": 1.297709923664122, "percentage": 43.26, "elapsed_time": "0:53:13", "remaining_time": "1:09:48"}
{"current_steps": 1540, "total_steps": 3537, "loss": 1.6189, "lr": 3.4740636718886264e-05, "epoch": 1.306191687871077, "percentage": 43.54, "elapsed_time": "0:53:33", "remaining_time": "1:09:27"}
{"current_steps": 1550, "total_steps": 3537, "loss": 1.6202, "lr": 3.45129178347907e-05, "epoch": 1.3146734520780323, "percentage": 43.82, "elapsed_time": "0:53:54", "remaining_time": "1:09:05"}
{"current_steps": 1560, "total_steps": 3537, "loss": 1.6241, "lr": 3.428427225597583e-05, "epoch": 1.3231552162849873, "percentage": 44.11, "elapsed_time": "0:54:14", "remaining_time": "1:08:44"}
{"current_steps": 1570, "total_steps": 3537, "loss": 1.6242, "lr": 3.405472225580238e-05, "epoch": 1.3316369804919423, "percentage": 44.39, "elapsed_time": "0:54:34", "remaining_time": "1:08:22"}
{"current_steps": 1580, "total_steps": 3537, "loss": 1.6077, "lr": 3.38242901957347e-05, "epoch": 1.3401187446988974, "percentage": 44.67, "elapsed_time": "0:54:55", "remaining_time": "1:08:01"}
{"current_steps": 1590, "total_steps": 3537, "loss": 1.6045, "lr": 3.359299852316242e-05, "epoch": 1.3486005089058524, "percentage": 44.95, "elapsed_time": "0:55:15", "remaining_time": "1:07:39"}
{"current_steps": 1600, "total_steps": 3537, "loss": 1.6098, "lr": 3.336086976921378e-05, "epoch": 1.3570822731128076, "percentage": 45.24, "elapsed_time": "0:55:35", "remaining_time": "1:07:18"}
{"current_steps": 1610, "total_steps": 3537, "loss": 1.6165, "lr": 3.312792654656073e-05, "epoch": 1.3655640373197624, "percentage": 45.52, "elapsed_time": "0:55:56", "remaining_time": "1:06:56"}
{"current_steps": 1620, "total_steps": 3537, "loss": 1.6013, "lr": 3.28941915472162e-05, "epoch": 1.3740458015267176, "percentage": 45.8, "elapsed_time": "0:56:16", "remaining_time": "1:06:35"}
{"current_steps": 1630, "total_steps": 3537, "loss": 1.5936, "lr": 3.2659687540323516e-05, "epoch": 1.3825275657336726, "percentage": 46.08, "elapsed_time": "0:56:36", "remaining_time": "1:06:13"}
{"current_steps": 1640, "total_steps": 3537, "loss": 1.5988, "lr": 3.242443736993837e-05, "epoch": 1.3910093299406276, "percentage": 46.37, "elapsed_time": "0:56:56", "remaining_time": "1:05:52"}
{"current_steps": 1650, "total_steps": 3537, "loss": 1.628, "lr": 3.218846395280349e-05, "epoch": 1.3994910941475827, "percentage": 46.65, "elapsed_time": "0:57:17", "remaining_time": "1:05:30"}
{"current_steps": 1660, "total_steps": 3537, "loss": 1.6094, "lr": 3.19517902761162e-05, "epoch": 1.4079728583545377, "percentage": 46.93, "elapsed_time": "0:57:37", "remaining_time": "1:05:09"}
{"current_steps": 1670, "total_steps": 3537, "loss": 1.6263, "lr": 3.171443939528919e-05, "epoch": 1.416454622561493, "percentage": 47.22, "elapsed_time": "0:57:57", "remaining_time": "1:04:48"}
{"current_steps": 1680, "total_steps": 3537, "loss": 1.5863, "lr": 3.147643443170454e-05, "epoch": 1.424936386768448, "percentage": 47.5, "elapsed_time": "0:58:18", "remaining_time": "1:04:26"}
{"current_steps": 1690, "total_steps": 3537, "loss": 1.5944, "lr": 3.123779857046134e-05, "epoch": 1.433418150975403, "percentage": 47.78, "elapsed_time": "0:58:38", "remaining_time": "1:04:05"}
{"current_steps": 1700, "total_steps": 3537, "loss": 1.6376, "lr": 3.0998555058117216e-05, "epoch": 1.441899915182358, "percentage": 48.06, "elapsed_time": "0:58:58", "remaining_time": "1:03:43"}
{"current_steps": 1710, "total_steps": 3537, "loss": 1.6132, "lr": 3.075872720042372e-05, "epoch": 1.450381679389313, "percentage": 48.35, "elapsed_time": "0:59:19", "remaining_time": "1:03:22"}
{"current_steps": 1720, "total_steps": 3537, "loss": 1.6218, "lr": 3.0518338360056e-05, "epoch": 1.458863443596268, "percentage": 48.63, "elapsed_time": "0:59:39", "remaining_time": "1:03:01"}
{"current_steps": 1730, "total_steps": 3537, "loss": 1.592, "lr": 3.0277411954337005e-05, "epoch": 1.467345207803223, "percentage": 48.91, "elapsed_time": "0:59:59", "remaining_time": "1:02:39"}
{"current_steps": 1740, "total_steps": 3537, "loss": 1.615, "lr": 3.0035971452956224e-05, "epoch": 1.4758269720101782, "percentage": 49.19, "elapsed_time": "1:00:20", "remaining_time": "1:02:18"}
{"current_steps": 1750, "total_steps": 3537, "loss": 1.6025, "lr": 2.9794040375683485e-05, "epoch": 1.4843087362171332, "percentage": 49.48, "elapsed_time": "1:00:40", "remaining_time": "1:01:57"}
{"current_steps": 1760, "total_steps": 3537, "loss": 1.6188, "lr": 2.9551642290077707e-05, "epoch": 1.4927905004240882, "percentage": 49.76, "elapsed_time": "1:01:00", "remaining_time": "1:01:36"}
{"current_steps": 1770, "total_steps": 3537, "loss": 1.6028, "lr": 2.9308800809191157e-05, "epoch": 1.5012722646310432, "percentage": 50.04, "elapsed_time": "1:01:20", "remaining_time": "1:01:14"}
{"current_steps": 1780, "total_steps": 3537, "loss": 1.6252, "lr": 2.9065539589269147e-05, "epoch": 1.5097540288379983, "percentage": 50.33, "elapsed_time": "1:01:41", "remaining_time": "1:00:53"}
{"current_steps": 1790, "total_steps": 3537, "loss": 1.6216, "lr": 2.8821882327445594e-05, "epoch": 1.5182357930449535, "percentage": 50.61, "elapsed_time": "1:02:01", "remaining_time": "1:00:32"}
{"current_steps": 1800, "total_steps": 3537, "loss": 1.6182, "lr": 2.857785275943458e-05, "epoch": 1.5267175572519083, "percentage": 50.89, "elapsed_time": "1:02:21", "remaining_time": "1:00:10"}
{"current_steps": 1800, "total_steps": 3537, "eval_loss": 1.6240788698196411, "epoch": 1.5267175572519083, "percentage": 50.89, "elapsed_time": "1:02:30", "remaining_time": "1:00:19"}
{"current_steps": 1810, "total_steps": 3537, "loss": 1.6002, "lr": 2.8333474657218174e-05, "epoch": 1.5351993214588635, "percentage": 51.17, "elapsed_time": "1:02:50", "remaining_time": "0:59:57"}
{"current_steps": 1820, "total_steps": 3537, "loss": 1.5973, "lr": 2.8088771826730643e-05, "epoch": 1.5436810856658185, "percentage": 51.46, "elapsed_time": "1:03:10", "remaining_time": "0:59:36"}
{"current_steps": 1830, "total_steps": 3537, "loss": 1.6262, "lr": 2.784376810553947e-05, "epoch": 1.5521628498727735, "percentage": 51.74, "elapsed_time": "1:03:31", "remaining_time": "0:59:14"}
{"current_steps": 1840, "total_steps": 3537, "loss": 1.5753, "lr": 2.759848736052321e-05, "epoch": 1.5606446140797285, "percentage": 52.02, "elapsed_time": "1:03:51", "remaining_time": "0:58:53"}
{"current_steps": 1850, "total_steps": 3537, "loss": 1.6209, "lr": 2.735295348554651e-05, "epoch": 1.5691263782866836, "percentage": 52.3, "elapsed_time": "1:04:11", "remaining_time": "0:58:32"}
{"current_steps": 1860, "total_steps": 3537, "loss": 1.6088, "lr": 2.7107190399132526e-05, "epoch": 1.5776081424936388, "percentage": 52.59, "elapsed_time": "1:04:32", "remaining_time": "0:58:11"}
{"current_steps": 1870, "total_steps": 3537, "loss": 1.6252, "lr": 2.686122204213285e-05, "epoch": 1.5860899067005936, "percentage": 52.87, "elapsed_time": "1:04:52", "remaining_time": "0:57:49"}
{"current_steps": 1880, "total_steps": 3537, "loss": 1.6112, "lr": 2.6615072375395423e-05, "epoch": 1.5945716709075488, "percentage": 53.15, "elapsed_time": "1:05:12", "remaining_time": "0:57:28"}
{"current_steps": 1890, "total_steps": 3537, "loss": 1.6146, "lr": 2.6368765377430344e-05, "epoch": 1.6030534351145038, "percentage": 53.44, "elapsed_time": "1:05:32", "remaining_time": "0:57:07"}
{"current_steps": 1900, "total_steps": 3537, "loss": 1.5834, "lr": 2.6122325042074014e-05, "epoch": 1.6115351993214588, "percentage": 53.72, "elapsed_time": "1:05:53", "remaining_time": "0:56:45"}
{"current_steps": 1910, "total_steps": 3537, "loss": 1.6151, "lr": 2.5875775376151823e-05, "epoch": 1.620016963528414, "percentage": 54.0, "elapsed_time": "1:06:13", "remaining_time": "0:56:24"}
{"current_steps": 1920, "total_steps": 3537, "loss": 1.5838, "lr": 2.562914039713953e-05, "epoch": 1.6284987277353689, "percentage": 54.28, "elapsed_time": "1:06:33", "remaining_time": "0:56:03"}
{"current_steps": 1930, "total_steps": 3537, "loss": 1.6254, "lr": 2.5382444130823612e-05, "epoch": 1.636980491942324, "percentage": 54.57, "elapsed_time": "1:06:54", "remaining_time": "0:55:42"}
{"current_steps": 1940, "total_steps": 3537, "loss": 1.5999, "lr": 2.5135710608960807e-05, "epoch": 1.645462256149279, "percentage": 54.85, "elapsed_time": "1:07:14", "remaining_time": "0:55:21"}
{"current_steps": 1950, "total_steps": 3537, "loss": 1.581, "lr": 2.4888963866937067e-05, "epoch": 1.6539440203562341, "percentage": 55.13, "elapsed_time": "1:07:34", "remaining_time": "0:54:59"}
{"current_steps": 1960, "total_steps": 3537, "loss": 1.6151, "lr": 2.464222794142619e-05, "epoch": 1.6624257845631891, "percentage": 55.41, "elapsed_time": "1:07:55", "remaining_time": "0:54:38"}
{"current_steps": 1970, "total_steps": 3537, "loss": 1.6062, "lr": 2.43955268680483e-05, "epoch": 1.6709075487701441, "percentage": 55.7, "elapsed_time": "1:08:15", "remaining_time": "0:54:17"}
{"current_steps": 1980, "total_steps": 3537, "loss": 1.6096, "lr": 2.4148884679028402e-05, "epoch": 1.6793893129770994, "percentage": 55.98, "elapsed_time": "1:08:35", "remaining_time": "0:53:56"}
{"current_steps": 1990, "total_steps": 3537, "loss": 1.5932, "lr": 2.390232540085533e-05, "epoch": 1.6878710771840542, "percentage": 56.26, "elapsed_time": "1:08:56", "remaining_time": "0:53:35"}
{"current_steps": 2000, "total_steps": 3537, "loss": 1.5809, "lr": 2.3655873051941203e-05, "epoch": 1.6963528413910094, "percentage": 56.55, "elapsed_time": "1:09:16", "remaining_time": "0:53:14"}
{"current_steps": 2010, "total_steps": 3537, "loss": 1.5818, "lr": 2.340955164028171e-05, "epoch": 1.7048346055979644, "percentage": 56.83, "elapsed_time": "1:09:58", "remaining_time": "0:53:09"}
{"current_steps": 2020, "total_steps": 3537, "loss": 1.5911, "lr": 2.3163385161117367e-05, "epoch": 1.7133163698049194, "percentage": 57.11, "elapsed_time": "1:10:18", "remaining_time": "0:52:47"}
{"current_steps": 2030, "total_steps": 3537, "loss": 1.5816, "lr": 2.291739759459605e-05, "epoch": 1.7217981340118744, "percentage": 57.39, "elapsed_time": "1:10:38", "remaining_time": "0:52:26"}
{"current_steps": 2040, "total_steps": 3537, "loss": 1.6033, "lr": 2.267161290343694e-05, "epoch": 1.7302798982188294, "percentage": 57.68, "elapsed_time": "1:10:59", "remaining_time": "0:52:05"}
{"current_steps": 2050, "total_steps": 3537, "loss": 1.6122, "lr": 2.2426055030596282e-05, "epoch": 1.7387616624257847, "percentage": 57.96, "elapsed_time": "1:11:19", "remaining_time": "0:51:44"}
{"current_steps": 2060, "total_steps": 3537, "loss": 1.5995, "lr": 2.2180747896934956e-05, "epoch": 1.7472434266327395, "percentage": 58.24, "elapsed_time": "1:11:39", "remaining_time": "0:51:23"}
{"current_steps": 2070, "total_steps": 3537, "loss": 1.5938, "lr": 2.193571539888824e-05, "epoch": 1.7557251908396947, "percentage": 58.52, "elapsed_time": "1:12:00", "remaining_time": "0:51:01"}
{"current_steps": 2080, "total_steps": 3537, "loss": 1.5792, "lr": 2.169098140613797e-05, "epoch": 1.7642069550466497, "percentage": 58.81, "elapsed_time": "1:12:20", "remaining_time": "0:50:40"}
{"current_steps": 2090, "total_steps": 3537, "loss": 1.5856, "lr": 2.1446569759287267e-05, "epoch": 1.7726887192536047, "percentage": 59.09, "elapsed_time": "1:12:41", "remaining_time": "0:50:19"}
{"current_steps": 2100, "total_steps": 3537, "loss": 1.5875, "lr": 2.120250426753815e-05, "epoch": 1.78117048346056, "percentage": 59.37, "elapsed_time": "1:13:01", "remaining_time": "0:49:58"}
{"current_steps": 2110, "total_steps": 3537, "loss": 1.5909, "lr": 2.095880870637216e-05, "epoch": 1.7896522476675147, "percentage": 59.66, "elapsed_time": "1:13:21", "remaining_time": "0:49:36"}
{"current_steps": 2120, "total_steps": 3537, "loss": 1.5812, "lr": 2.071550681523429e-05, "epoch": 1.79813401187447, "percentage": 59.94, "elapsed_time": "1:13:42", "remaining_time": "0:49:15"}
{"current_steps": 2130, "total_steps": 3537, "loss": 1.5909, "lr": 2.0472622295220413e-05, "epoch": 1.806615776081425, "percentage": 60.22, "elapsed_time": "1:14:02", "remaining_time": "0:48:54"}
{"current_steps": 2140, "total_steps": 3537, "loss": 1.5852, "lr": 2.023017880676849e-05, "epoch": 1.81509754028838, "percentage": 60.5, "elapsed_time": "1:14:22", "remaining_time": "0:48:33"}
{"current_steps": 2150, "total_steps": 3537, "loss": 1.5997, "lr": 1.9988199967353642e-05, "epoch": 1.823579304495335, "percentage": 60.79, "elapsed_time": "1:14:42", "remaining_time": "0:48:12"}
{"current_steps": 2160, "total_steps": 3537, "loss": 1.6062, "lr": 1.974670934918753e-05, "epoch": 1.83206106870229, "percentage": 61.07, "elapsed_time": "1:15:03", "remaining_time": "0:47:50"}
{"current_steps": 2170, "total_steps": 3537, "loss": 1.6112, "lr": 1.9505730476922064e-05, "epoch": 1.8405428329092453, "percentage": 61.35, "elapsed_time": "1:15:23", "remaining_time": "0:47:29"}
{"current_steps": 2180, "total_steps": 3537, "loss": 1.6001, "lr": 1.9265286825357742e-05, "epoch": 1.8490245971162, "percentage": 61.63, "elapsed_time": "1:15:43", "remaining_time": "0:47:08"}
{"current_steps": 2190, "total_steps": 3537, "loss": 1.6122, "lr": 1.9025401817156905e-05, "epoch": 1.8575063613231553, "percentage": 61.92, "elapsed_time": "1:16:04", "remaining_time": "0:46:47"}
{"current_steps": 2200, "total_steps": 3537, "loss": 1.5837, "lr": 1.8786098820561972e-05, "epoch": 1.8659881255301103, "percentage": 62.2, "elapsed_time": "1:16:24", "remaining_time": "0:46:26"}
{"current_steps": 2210, "total_steps": 3537, "loss": 1.6056, "lr": 1.8547401147119127e-05, "epoch": 1.8744698897370653, "percentage": 62.48, "elapsed_time": "1:16:44", "remaining_time": "0:46:04"}
{"current_steps": 2220, "total_steps": 3537, "loss": 1.5898, "lr": 1.8309332049407363e-05, "epoch": 1.8829516539440203, "percentage": 62.77, "elapsed_time": "1:17:04", "remaining_time": "0:45:43"}
{"current_steps": 2230, "total_steps": 3537, "loss": 1.5803, "lr": 1.8071914718773393e-05, "epoch": 1.8914334181509753, "percentage": 63.05, "elapsed_time": "1:17:25", "remaining_time": "0:45:22"}
{"current_steps": 2240, "total_steps": 3537, "loss": 1.5908, "lr": 1.783517228307245e-05, "epoch": 1.8999151823579306, "percentage": 63.33, "elapsed_time": "1:17:45", "remaining_time": "0:45:01"}
{"current_steps": 2250, "total_steps": 3537, "loss": 1.6114, "lr": 1.7599127804415317e-05, "epoch": 1.9083969465648853, "percentage": 63.61, "elapsed_time": "1:18:05", "remaining_time": "0:44:40"}
{"current_steps": 2260, "total_steps": 3537, "loss": 1.5835, "lr": 1.7363804276921748e-05, "epoch": 1.9168787107718406, "percentage": 63.9, "elapsed_time": "1:18:26", "remaining_time": "0:44:19"}
{"current_steps": 2270, "total_steps": 3537, "loss": 1.5937, "lr": 1.7129224624480506e-05, "epoch": 1.9253604749787956, "percentage": 64.18, "elapsed_time": "1:18:46", "remaining_time": "0:43:58"}
{"current_steps": 2280, "total_steps": 3537, "loss": 1.6138, "lr": 1.689541169851625e-05, "epoch": 1.9338422391857506, "percentage": 64.46, "elapsed_time": "1:19:06", "remaining_time": "0:43:36"}
{"current_steps": 2290, "total_steps": 3537, "loss": 1.5972, "lr": 1.6662388275763484e-05, "epoch": 1.9423240033927058, "percentage": 64.74, "elapsed_time": "1:19:27", "remaining_time": "0:43:15"}
{"current_steps": 2300, "total_steps": 3537, "loss": 1.6007, "lr": 1.643017705604774e-05, "epoch": 1.9508057675996606, "percentage": 65.03, "elapsed_time": "1:19:47", "remaining_time": "0:42:54"}
{"current_steps": 2310, "total_steps": 3537, "loss": 1.5868, "lr": 1.6198800660074353e-05, "epoch": 1.9592875318066159, "percentage": 65.31, "elapsed_time": "1:20:07", "remaining_time": "0:42:33"}
{"current_steps": 2320, "total_steps": 3537, "loss": 1.5554, "lr": 1.5968281627224823e-05, "epoch": 1.9677692960135709, "percentage": 65.59, "elapsed_time": "1:20:28", "remaining_time": "0:42:12"}
{"current_steps": 2330, "total_steps": 3537, "loss": 1.6222, "lr": 1.573864241336119e-05, "epoch": 1.9762510602205259, "percentage": 65.88, "elapsed_time": "1:20:48", "remaining_time": "0:41:51"}
{"current_steps": 2340, "total_steps": 3537, "loss": 1.5684, "lr": 1.550990538863848e-05, "epoch": 1.984732824427481, "percentage": 66.16, "elapsed_time": "1:21:08", "remaining_time": "0:41:30"}
{"current_steps": 2350, "total_steps": 3537, "loss": 1.6103, "lr": 1.528209283532559e-05, "epoch": 1.993214588634436, "percentage": 66.44, "elapsed_time": "1:21:28", "remaining_time": "0:41:09"}
{"current_steps": 2360, "total_steps": 3537, "loss": 1.5866, "lr": 1.5055226945634571e-05, "epoch": 2.001696352841391, "percentage": 66.72, "elapsed_time": "1:21:49", "remaining_time": "0:40:48"}
{"current_steps": 2370, "total_steps": 3537, "loss": 1.524, "lr": 1.4829329819558905e-05, "epoch": 2.010178117048346, "percentage": 67.01, "elapsed_time": "1:22:09", "remaining_time": "0:40:27"}
{"current_steps": 2380, "total_steps": 3537, "loss": 1.5222, "lr": 1.4604423462720574e-05, "epoch": 2.018659881255301, "percentage": 67.29, "elapsed_time": "1:22:29", "remaining_time": "0:40:06"}
{"current_steps": 2390, "total_steps": 3537, "loss": 1.538, "lr": 1.438052978422641e-05, "epoch": 2.027141645462256, "percentage": 67.57, "elapsed_time": "1:22:50", "remaining_time": "0:39:45"}
{"current_steps": 2400, "total_steps": 3537, "loss": 1.5463, "lr": 1.4157670594533879e-05, "epoch": 2.035623409669211, "percentage": 67.85, "elapsed_time": "1:23:10", "remaining_time": "0:39:24"}
{"current_steps": 2400, "total_steps": 3537, "eval_loss": 1.6182470321655273, "epoch": 2.035623409669211, "percentage": 67.85, "elapsed_time": "1:23:18", "remaining_time": "0:39:28"}
{"current_steps": 2410, "total_steps": 3537, "loss": 1.5402, "lr": 1.393586760332633e-05, "epoch": 2.0441051738761664, "percentage": 68.14, "elapsed_time": "1:23:39", "remaining_time": "0:39:07"}
{"current_steps": 2420, "total_steps": 3537, "loss": 1.5312, "lr": 1.3715142417398275e-05, "epoch": 2.052586938083121, "percentage": 68.42, "elapsed_time": "1:23:59", "remaining_time": "0:38:46"}
{"current_steps": 2430, "total_steps": 3537, "loss": 1.5251, "lr": 1.3495516538550495e-05, "epoch": 2.0610687022900764, "percentage": 68.7, "elapsed_time": "1:24:19", "remaining_time": "0:38:24"}
{"current_steps": 2440, "total_steps": 3537, "loss": 1.5536, "lr": 1.3277011361495498e-05, "epoch": 2.0695504664970312, "percentage": 68.99, "elapsed_time": "1:24:40", "remaining_time": "0:38:03"}
{"current_steps": 2450, "total_steps": 3537, "loss": 1.5608, "lr": 1.3059648171773361e-05, "epoch": 2.0780322307039865, "percentage": 69.27, "elapsed_time": "1:25:00", "remaining_time": "0:37:42"}
{"current_steps": 2460, "total_steps": 3537, "loss": 1.5314, "lr": 1.2843448143678175e-05, "epoch": 2.0865139949109412, "percentage": 69.55, "elapsed_time": "1:25:20", "remaining_time": "0:37:21"}
{"current_steps": 2470, "total_steps": 3537, "loss": 1.5769, "lr": 1.2628432338195423e-05, "epoch": 2.0949957591178965, "percentage": 69.83, "elapsed_time": "1:25:40", "remaining_time": "0:37:00"}
{"current_steps": 2480, "total_steps": 3537, "loss": 1.5392, "lr": 1.2414621700950307e-05, "epoch": 2.1034775233248517, "percentage": 70.12, "elapsed_time": "1:26:01", "remaining_time": "0:36:39"}
{"current_steps": 2490, "total_steps": 3537, "loss": 1.5482, "lr": 1.2202037060167338e-05, "epoch": 2.1119592875318065, "percentage": 70.4, "elapsed_time": "1:26:21", "remaining_time": "0:36:18"}
{"current_steps": 2500, "total_steps": 3537, "loss": 1.5305, "lr": 1.1990699124641385e-05, "epoch": 2.1204410517387617, "percentage": 70.68, "elapsed_time": "1:26:41", "remaining_time": "0:35:57"}
{"current_steps": 2510, "total_steps": 3537, "loss": 1.5205, "lr": 1.1780628481720333e-05, "epoch": 2.1289228159457165, "percentage": 70.96, "elapsed_time": "1:27:24", "remaining_time": "0:35:45"}
{"current_steps": 2520, "total_steps": 3537, "loss": 1.5377, "lr": 1.1571845595299571e-05, "epoch": 2.1374045801526718, "percentage": 71.25, "elapsed_time": "1:27:44", "remaining_time": "0:35:24"}
{"current_steps": 2530, "total_steps": 3537, "loss": 1.5274, "lr": 1.1364370803828536e-05, "epoch": 2.145886344359627, "percentage": 71.53, "elapsed_time": "1:28:04", "remaining_time": "0:35:03"}
{"current_steps": 2540, "total_steps": 3537, "loss": 1.5422, "lr": 1.1158224318329439e-05, "epoch": 2.154368108566582, "percentage": 71.81, "elapsed_time": "1:28:25", "remaining_time": "0:34:42"}
{"current_steps": 2550, "total_steps": 3537, "loss": 1.5189, "lr": 1.0953426220428417e-05, "epoch": 2.162849872773537, "percentage": 72.09, "elapsed_time": "1:28:45", "remaining_time": "0:34:21"}
{"current_steps": 2560, "total_steps": 3537, "loss": 1.545, "lr": 1.0749996460399334e-05, "epoch": 2.171331636980492, "percentage": 72.38, "elapsed_time": "1:29:05", "remaining_time": "0:34:00"}
{"current_steps": 2570, "total_steps": 3537, "loss": 1.5395, "lr": 1.0547954855220258e-05, "epoch": 2.179813401187447, "percentage": 72.66, "elapsed_time": "1:29:26", "remaining_time": "0:33:39"}
{"current_steps": 2580, "total_steps": 3537, "loss": 1.5427, "lr": 1.0347321086643098e-05, "epoch": 2.188295165394402, "percentage": 72.94, "elapsed_time": "1:29:46", "remaining_time": "0:33:17"}
{"current_steps": 2590, "total_steps": 3537, "loss": 1.5424, "lr": 1.0148114699276254e-05, "epoch": 2.196776929601357, "percentage": 73.23, "elapsed_time": "1:30:06", "remaining_time": "0:32:56"}
{"current_steps": 2600, "total_steps": 3537, "loss": 1.5274, "lr": 9.950355098680716e-06, "epoch": 2.2052586938083123, "percentage": 73.51, "elapsed_time": "1:30:27", "remaining_time": "0:32:35"}
{"current_steps": 2610, "total_steps": 3537, "loss": 1.5466, "lr": 9.754061549479684e-06, "epoch": 2.213740458015267, "percentage": 73.79, "elapsed_time": "1:30:47", "remaining_time": "0:32:14"}
{"current_steps": 2620, "total_steps": 3537, "loss": 1.5228, "lr": 9.559253173481894e-06, "epoch": 2.2222222222222223, "percentage": 74.07, "elapsed_time": "1:31:07", "remaining_time": "0:31:53"}
{"current_steps": 2630, "total_steps": 3537, "loss": 1.5392, "lr": 9.365948947818917e-06, "epoch": 2.230703986429177, "percentage": 74.36, "elapsed_time": "1:31:27", "remaining_time": "0:31:32"}
{"current_steps": 2640, "total_steps": 3537, "loss": 1.5312, "lr": 9.174167703096487e-06, "epoch": 2.2391857506361323, "percentage": 74.64, "elapsed_time": "1:31:48", "remaining_time": "0:31:11"}
{"current_steps": 2650, "total_steps": 3537, "loss": 1.5506, "lr": 8.983928121560142e-06, "epoch": 2.247667514843087, "percentage": 74.92, "elapsed_time": "1:32:08", "remaining_time": "0:30:50"}
{"current_steps": 2660, "total_steps": 3537, "loss": 1.5392, "lr": 8.795248735275295e-06, "epoch": 2.2561492790500424, "percentage": 75.2, "elapsed_time": "1:32:28", "remaining_time": "0:30:29"}
{"current_steps": 2670, "total_steps": 3537, "loss": 1.5313, "lr": 8.608147924321954e-06, "epoch": 2.2646310432569976, "percentage": 75.49, "elapsed_time": "1:32:48", "remaining_time": "0:30:08"}
{"current_steps": 2680, "total_steps": 3537, "loss": 1.5379, "lr": 8.422643915004242e-06, "epoch": 2.2731128074639524, "percentage": 75.77, "elapsed_time": "1:33:09", "remaining_time": "0:29:47"}
{"current_steps": 2690, "total_steps": 3537, "loss": 1.5187, "lr": 8.238754778074869e-06, "epoch": 2.2815945716709076, "percentage": 76.05, "elapsed_time": "1:33:29", "remaining_time": "0:29:26"}
{"current_steps": 2700, "total_steps": 3537, "loss": 1.5436, "lr": 8.056498426974817e-06, "epoch": 2.2900763358778624, "percentage": 76.34, "elapsed_time": "1:33:49", "remaining_time": "0:29:05"}
{"current_steps": 2710, "total_steps": 3537, "loss": 1.5349, "lr": 7.875892616088293e-06, "epoch": 2.2985581000848176, "percentage": 76.62, "elapsed_time": "1:34:10", "remaining_time": "0:28:44"}
{"current_steps": 2720, "total_steps": 3537, "loss": 1.5157, "lr": 7.696954939013182e-06, "epoch": 2.307039864291773, "percentage": 76.9, "elapsed_time": "1:34:30", "remaining_time": "0:28:23"}
{"current_steps": 2730, "total_steps": 3537, "loss": 1.5115, "lr": 7.5197028268472134e-06, "epoch": 2.3155216284987277, "percentage": 77.18, "elapsed_time": "1:34:50", "remaining_time": "0:28:02"}
{"current_steps": 2740, "total_steps": 3537, "loss": 1.5391, "lr": 7.344153546489904e-06, "epoch": 2.324003392705683, "percentage": 77.47, "elapsed_time": "1:35:11", "remaining_time": "0:27:41"}
{"current_steps": 2750, "total_steps": 3537, "loss": 1.5305, "lr": 7.17032419896051e-06, "epoch": 2.3324851569126377, "percentage": 77.75, "elapsed_time": "1:35:31", "remaining_time": "0:27:20"}
{"current_steps": 2760, "total_steps": 3537, "loss": 1.5011, "lr": 6.998231717732148e-06, "epoch": 2.340966921119593, "percentage": 78.03, "elapsed_time": "1:35:51", "remaining_time": "0:26:59"}
{"current_steps": 2770, "total_steps": 3537, "loss": 1.503, "lr": 6.827892867082236e-06, "epoch": 2.349448685326548, "percentage": 78.31, "elapsed_time": "1:36:12", "remaining_time": "0:26:38"}
{"current_steps": 2780, "total_steps": 3537, "loss": 1.5295, "lr": 6.659324240459389e-06, "epoch": 2.357930449533503, "percentage": 78.6, "elapsed_time": "1:36:32", "remaining_time": "0:26:17"}
{"current_steps": 2790, "total_steps": 3537, "loss": 1.539, "lr": 6.492542258867013e-06, "epoch": 2.366412213740458, "percentage": 78.88, "elapsed_time": "1:36:52", "remaining_time": "0:25:56"}
{"current_steps": 2800, "total_steps": 3537, "loss": 1.5195, "lr": 6.327563169263651e-06, "epoch": 2.374893977947413, "percentage": 79.16, "elapsed_time": "1:37:13", "remaining_time": "0:25:35"}
{"current_steps": 2810, "total_steps": 3537, "loss": 1.5154, "lr": 6.164403042980277e-06, "epoch": 2.383375742154368, "percentage": 79.45, "elapsed_time": "1:37:33", "remaining_time": "0:25:14"}
{"current_steps": 2820, "total_steps": 3537, "loss": 1.5294, "lr": 6.00307777415475e-06, "epoch": 2.391857506361323, "percentage": 79.73, "elapsed_time": "1:37:53", "remaining_time": "0:24:53"}
{"current_steps": 2830, "total_steps": 3537, "loss": 1.5282, "lr": 5.843603078183465e-06, "epoch": 2.4003392705682782, "percentage": 80.01, "elapsed_time": "1:38:14", "remaining_time": "0:24:32"}
{"current_steps": 2840, "total_steps": 3537, "loss": 1.5159, "lr": 5.685994490190474e-06, "epoch": 2.408821034775233, "percentage": 80.29, "elapsed_time": "1:38:34", "remaining_time": "0:24:11"}
{"current_steps": 2850, "total_steps": 3537, "loss": 1.5402, "lr": 5.530267363514124e-06, "epoch": 2.4173027989821882, "percentage": 80.58, "elapsed_time": "1:38:54", "remaining_time": "0:23:50"}
{"current_steps": 2860, "total_steps": 3537, "loss": 1.5255, "lr": 5.3764368682114315e-06, "epoch": 2.4257845631891435, "percentage": 80.86, "elapsed_time": "1:39:15", "remaining_time": "0:23:29"}
{"current_steps": 2870, "total_steps": 3537, "loss": 1.5335, "lr": 5.2245179895803044e-06, "epoch": 2.4342663273960983, "percentage": 81.14, "elapsed_time": "1:39:35", "remaining_time": "0:23:08"}
{"current_steps": 2880, "total_steps": 3537, "loss": 1.5305, "lr": 5.074525526699736e-06, "epoch": 2.4427480916030535, "percentage": 81.42, "elapsed_time": "1:39:56", "remaining_time": "0:22:47"}
{"current_steps": 2890, "total_steps": 3537, "loss": 1.5533, "lr": 4.926474090988193e-06, "epoch": 2.4512298558100083, "percentage": 81.71, "elapsed_time": "1:40:16", "remaining_time": "0:22:26"}
{"current_steps": 2900, "total_steps": 3537, "loss": 1.5158, "lr": 4.780378104780234e-06, "epoch": 2.4597116200169635, "percentage": 81.99, "elapsed_time": "1:40:36", "remaining_time": "0:22:05"}
{"current_steps": 2910, "total_steps": 3537, "loss": 1.525, "lr": 4.636251799921579e-06, "epoch": 2.4681933842239188, "percentage": 82.27, "elapsed_time": "1:40:57", "remaining_time": "0:21:45"}
{"current_steps": 2920, "total_steps": 3537, "loss": 1.514, "lr": 4.4941092163827135e-06, "epoch": 2.4766751484308736, "percentage": 82.56, "elapsed_time": "1:41:17", "remaining_time": "0:21:24"}
{"current_steps": 2930, "total_steps": 3537, "loss": 1.5393, "lr": 4.353964200891192e-06, "epoch": 2.485156912637829, "percentage": 82.84, "elapsed_time": "1:41:37", "remaining_time": "0:21:03"}
{"current_steps": 2940, "total_steps": 3537, "loss": 1.5401, "lr": 4.215830405582777e-06, "epoch": 2.4936386768447836, "percentage": 83.12, "elapsed_time": "1:41:57", "remaining_time": "0:20:42"}
{"current_steps": 2950, "total_steps": 3537, "loss": 1.5417, "lr": 4.079721286671528e-06, "epoch": 2.502120441051739, "percentage": 83.4, "elapsed_time": "1:42:18", "remaining_time": "0:20:21"}
{"current_steps": 2960, "total_steps": 3537, "loss": 1.5291, "lr": 3.945650103138962e-06, "epoch": 2.510602205258694, "percentage": 83.69, "elapsed_time": "1:42:38", "remaining_time": "0:20:00"}
{"current_steps": 2970, "total_steps": 3537, "loss": 1.5305, "lr": 3.813629915442435e-06, "epoch": 2.519083969465649, "percentage": 83.97, "elapsed_time": "1:42:58", "remaining_time": "0:19:39"}
{"current_steps": 2980, "total_steps": 3537, "loss": 1.5355, "lr": 3.6836735842429027e-06, "epoch": 2.527565733672604, "percentage": 84.25, "elapsed_time": "1:43:19", "remaining_time": "0:19:18"}
{"current_steps": 2990, "total_steps": 3537, "loss": 1.5618, "lr": 3.5557937691520382e-06, "epoch": 2.536047497879559, "percentage": 84.53, "elapsed_time": "1:43:39", "remaining_time": "0:18:57"}
{"current_steps": 3000, "total_steps": 3537, "loss": 1.5356, "lr": 3.4300029274990734e-06, "epoch": 2.544529262086514, "percentage": 84.82, "elapsed_time": "1:43:59", "remaining_time": "0:18:36"}
{"current_steps": 3000, "total_steps": 3537, "eval_loss": 1.6116546392440796, "epoch": 2.544529262086514, "percentage": 84.82, "elapsed_time": "1:44:08", "remaining_time": "0:18:38"}
{"current_steps": 3010, "total_steps": 3537, "loss": 1.5331, "lr": 3.3063133131172403e-06, "epoch": 2.553011026293469, "percentage": 85.1, "elapsed_time": "1:44:51", "remaining_time": "0:18:21"}
{"current_steps": 3020, "total_steps": 3537, "loss": 1.5251, "lr": 3.1847369751500766e-06, "epoch": 2.561492790500424, "percentage": 85.38, "elapsed_time": "1:45:11", "remaining_time": "0:18:00"}
{"current_steps": 3030, "total_steps": 3537, "loss": 1.5296, "lr": 3.065285756877684e-06, "epoch": 2.569974554707379, "percentage": 85.67, "elapsed_time": "1:45:32", "remaining_time": "0:17:39"}
{"current_steps": 3040, "total_steps": 3537, "loss": 1.5432, "lr": 2.947971294562976e-06, "epoch": 2.578456318914334, "percentage": 85.95, "elapsed_time": "1:45:52", "remaining_time": "0:17:18"}
{"current_steps": 3050, "total_steps": 3537, "loss": 1.5209, "lr": 2.8328050163182017e-06, "epoch": 2.5869380831212894, "percentage": 86.23, "elapsed_time": "1:46:12", "remaining_time": "0:16:57"}
{"current_steps": 3060, "total_steps": 3537, "loss": 1.5096, "lr": 2.7197981409916416e-06, "epoch": 2.595419847328244, "percentage": 86.51, "elapsed_time": "1:46:33", "remaining_time": "0:16:36"}
{"current_steps": 3070, "total_steps": 3537, "loss": 1.5133, "lr": 2.6089616770747394e-06, "epoch": 2.6039016115351994, "percentage": 86.8, "elapsed_time": "1:46:53", "remaining_time": "0:16:15"}
{"current_steps": 3080, "total_steps": 3537, "loss": 1.5477, "lr": 2.500306421629728e-06, "epoch": 2.612383375742154, "percentage": 87.08, "elapsed_time": "1:47:13", "remaining_time": "0:15:54"}
{"current_steps": 3090, "total_steps": 3537, "loss": 1.5082, "lr": 2.393842959237813e-06, "epoch": 2.6208651399491094, "percentage": 87.36, "elapsed_time": "1:47:34", "remaining_time": "0:15:33"}
{"current_steps": 3100, "total_steps": 3537, "loss": 1.5568, "lr": 2.289581660968121e-06, "epoch": 2.6293469041560646, "percentage": 87.64, "elapsed_time": "1:47:54", "remaining_time": "0:15:12"}
{"current_steps": 3110, "total_steps": 3537, "loss": 1.5065, "lr": 2.187532683367385e-06, "epoch": 2.6378286683630194, "percentage": 87.93, "elapsed_time": "1:48:14", "remaining_time": "0:14:51"}
{"current_steps": 3120, "total_steps": 3537, "loss": 1.5217, "lr": 2.0877059674705464e-06, "epoch": 2.6463104325699747, "percentage": 88.21, "elapsed_time": "1:48:35", "remaining_time": "0:14:30"}
{"current_steps": 3130, "total_steps": 3537, "loss": 1.5044, "lr": 1.9901112378323846e-06, "epoch": 2.6547921967769295, "percentage": 88.49, "elapsed_time": "1:48:55", "remaining_time": "0:14:09"}
{"current_steps": 3140, "total_steps": 3537, "loss": 1.536, "lr": 1.8947580015801575e-06, "epoch": 2.6632739609838847, "percentage": 88.78, "elapsed_time": "1:49:15", "remaining_time": "0:13:48"}
{"current_steps": 3150, "total_steps": 3537, "loss": 1.5325, "lr": 1.8016555474875213e-06, "epoch": 2.67175572519084, "percentage": 89.06, "elapsed_time": "1:49:35", "remaining_time": "0:13:27"}
{"current_steps": 3160, "total_steps": 3537, "loss": 1.5302, "lr": 1.710812945069637e-06, "epoch": 2.6802374893977947, "percentage": 89.34, "elapsed_time": "1:49:56", "remaining_time": "0:13:06"}
{"current_steps": 3170, "total_steps": 3537, "loss": 1.5353, "lr": 1.622239043699686e-06, "epoch": 2.68871925360475, "percentage": 89.62, "elapsed_time": "1:50:16", "remaining_time": "0:12:46"}
{"current_steps": 3180, "total_steps": 3537, "loss": 1.5171, "lr": 1.535942471746807e-06, "epoch": 2.6972010178117047, "percentage": 89.91, "elapsed_time": "1:50:36", "remaining_time": "0:12:25"}
{"current_steps": 3190, "total_steps": 3537, "loss": 1.5308, "lr": 1.4519316357355733e-06, "epoch": 2.70568278201866, "percentage": 90.19, "elapsed_time": "1:50:57", "remaining_time": "0:12:04"}
{"current_steps": 3200, "total_steps": 3537, "loss": 1.5366, "lr": 1.3702147195270687e-06, "epoch": 2.714164546225615, "percentage": 90.47, "elapsed_time": "1:51:17", "remaining_time": "0:11:43"}
{"current_steps": 3210, "total_steps": 3537, "loss": 1.5148, "lr": 1.2907996835216734e-06, "epoch": 2.72264631043257, "percentage": 90.75, "elapsed_time": "1:51:37", "remaining_time": "0:11:22"}
{"current_steps": 3220, "total_steps": 3537, "loss": 1.5228, "lr": 1.2136942638835995e-06, "epoch": 2.731128074639525, "percentage": 91.04, "elapsed_time": "1:51:57", "remaining_time": "0:11:01"}
{"current_steps": 3230, "total_steps": 3537, "loss": 1.5197, "lr": 1.1389059717872741e-06, "epoch": 2.73960983884648, "percentage": 91.32, "elapsed_time": "1:52:18", "remaining_time": "0:10:40"}
{"current_steps": 3240, "total_steps": 3537, "loss": 1.5125, "lr": 1.06644209268566e-06, "epoch": 2.7480916030534353, "percentage": 91.6, "elapsed_time": "1:52:38", "remaining_time": "0:10:19"}
{"current_steps": 3250, "total_steps": 3537, "loss": 1.5549, "lr": 9.963096856005216e-07, "epoch": 2.75657336726039, "percentage": 91.89, "elapsed_time": "1:52:58", "remaining_time": "0:09:58"}
{"current_steps": 3260, "total_steps": 3537, "loss": 1.5183, "lr": 9.285155824347969e-07, "epoch": 2.7650551314673453, "percentage": 92.17, "elapsed_time": "1:53:19", "remaining_time": "0:09:37"}
{"current_steps": 3270, "total_steps": 3537, "loss": 1.5323, "lr": 8.630663873070627e-07, "epoch": 2.7735368956743, "percentage": 92.45, "elapsed_time": "1:53:39", "remaining_time": "0:09:16"}
{"current_steps": 3280, "total_steps": 3537, "loss": 1.5202, "lr": 7.999684759082083e-07, "epoch": 2.7820186598812553, "percentage": 92.73, "elapsed_time": "1:53:59", "remaining_time": "0:08:55"}
{"current_steps": 3290, "total_steps": 3537, "loss": 1.541, "lr": 7.392279948803371e-07, "epoch": 2.7905004240882105, "percentage": 93.02, "elapsed_time": "1:54:20", "remaining_time": "0:08:35"}
{"current_steps": 3300, "total_steps": 3537, "loss": 1.5437, "lr": 6.808508612179937e-07, "epoch": 2.7989821882951653, "percentage": 93.3, "elapsed_time": "1:54:40", "remaining_time": "0:08:14"}
{"current_steps": 3310, "total_steps": 3537, "loss": 1.5489, "lr": 6.248427616917907e-07, "epoch": 2.8074639525021206, "percentage": 93.58, "elapsed_time": "1:55:00", "remaining_time": "0:07:53"}
{"current_steps": 3320, "total_steps": 3537, "loss": 1.5159, "lr": 5.712091522943996e-07, "epoch": 2.8159457167090753, "percentage": 93.86, "elapsed_time": "1:55:20", "remaining_time": "0:07:32"}
{"current_steps": 3330, "total_steps": 3537, "loss": 1.5359, "lr": 5.199552577090927e-07, "epoch": 2.8244274809160306, "percentage": 94.15, "elapsed_time": "1:55:41", "remaining_time": "0:07:11"}
{"current_steps": 3340, "total_steps": 3537, "loss": 1.5281, "lr": 4.710860708007553e-07, "epoch": 2.832909245122986, "percentage": 94.43, "elapsed_time": "1:56:01", "remaining_time": "0:06:50"}
{"current_steps": 3350, "total_steps": 3537, "loss": 1.511, "lr": 4.2460635212952515e-07, "epoch": 2.8413910093299406, "percentage": 94.71, "elapsed_time": "1:56:21", "remaining_time": "0:06:29"}
{"current_steps": 3360, "total_steps": 3537, "loss": 1.5074, "lr": 3.805206294870439e-07, "epoch": 2.849872773536896, "percentage": 95.0, "elapsed_time": "1:56:42", "remaining_time": "0:06:08"}
{"current_steps": 3370, "total_steps": 3537, "loss": 1.5001, "lr": 3.388331974553821e-07, "epoch": 2.8583545377438506, "percentage": 95.28, "elapsed_time": "1:57:02", "remaining_time": "0:05:47"}
{"current_steps": 3380, "total_steps": 3537, "loss": 1.5362, "lr": 2.995481169886849e-07, "epoch": 2.866836301950806, "percentage": 95.56, "elapsed_time": "1:57:22", "remaining_time": "0:05:27"}
{"current_steps": 3390, "total_steps": 3537, "loss": 1.5205, "lr": 2.6266921501758024e-07, "epoch": 2.875318066157761, "percentage": 95.84, "elapsed_time": "1:57:42", "remaining_time": "0:05:06"}
{"current_steps": 3400, "total_steps": 3537, "loss": 1.5117, "lr": 2.2820008407637983e-07, "epoch": 2.883799830364716, "percentage": 96.13, "elapsed_time": "1:58:03", "remaining_time": "0:04:45"}
{"current_steps": 3410, "total_steps": 3537, "loss": 1.5184, "lr": 1.9614408195310907e-07, "epoch": 2.8922815945716707, "percentage": 96.41, "elapsed_time": "1:58:23", "remaining_time": "0:04:24"}
{"current_steps": 3420, "total_steps": 3537, "loss": 1.5141, "lr": 1.6650433136241872e-07, "epoch": 2.900763358778626, "percentage": 96.69, "elapsed_time": "1:58:43", "remaining_time": "0:04:03"}
{"current_steps": 3430, "total_steps": 3537, "loss": 1.5328, "lr": 1.3928371964138653e-07, "epoch": 2.909245122985581, "percentage": 96.97, "elapsed_time": "1:59:04", "remaining_time": "0:03:42"}
{"current_steps": 3440, "total_steps": 3537, "loss": 1.5251, "lr": 1.1448489846824228e-07, "epoch": 2.917726887192536, "percentage": 97.26, "elapsed_time": "1:59:24", "remaining_time": "0:03:22"}
{"current_steps": 3450, "total_steps": 3537, "loss": 1.5303, "lr": 9.211028360406326e-08, "epoch": 2.926208651399491, "percentage": 97.54, "elapsed_time": "1:59:44", "remaining_time": "0:03:01"}
{"current_steps": 3460, "total_steps": 3537, "loss": 1.5128, "lr": 7.216205465743753e-08, "epoch": 2.934690415606446, "percentage": 97.82, "elapsed_time": "2:00:05", "remaining_time": "0:02:40"}
{"current_steps": 3470, "total_steps": 3537, "loss": 1.5382, "lr": 5.464215487214763e-08, "epoch": 2.943172179813401, "percentage": 98.11, "elapsed_time": "2:00:25", "remaining_time": "0:02:19"}
{"current_steps": 3480, "total_steps": 3537, "loss": 1.5374, "lr": 3.95522909378665e-08, "epoch": 2.9516539440203564, "percentage": 98.39, "elapsed_time": "2:00:45", "remaining_time": "0:01:58"}
{"current_steps": 3490, "total_steps": 3537, "loss": 1.5138, "lr": 2.6893932823898738e-08, "epoch": 2.960135708227311, "percentage": 98.67, "elapsed_time": "2:01:06", "remaining_time": "0:01:37"}
{"current_steps": 3500, "total_steps": 3537, "loss": 1.5293, "lr": 1.666831363598964e-08, "epoch": 2.9686174724342664, "percentage": 98.95, "elapsed_time": "2:01:26", "remaining_time": "0:01:17"}
{"current_steps": 3510, "total_steps": 3537, "loss": 1.545, "lr": 8.876429496193494e-09, "epoch": 2.9770992366412212, "percentage": 99.24, "elapsed_time": "2:02:09", "remaining_time": "0:00:56"}
{"current_steps": 3520, "total_steps": 3537, "loss": 1.5387, "lr": 3.519039445851191e-09, "epoch": 2.9855810008481765, "percentage": 99.52, "elapsed_time": "2:02:29", "remaining_time": "0:00:35"}
{"current_steps": 3530, "total_steps": 3537, "loss": 1.533, "lr": 5.966653716410476e-10, "epoch": 2.9940627650551317, "percentage": 99.8, "elapsed_time": "2:02:49", "remaining_time": "0:00:14"}
{"current_steps": 3537, "total_steps": 3537, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2:03:23", "remaining_time": "0:00:00"}