Upload trainer_log.jsonl with huggingface_hub
Browse files- trainer_log.jsonl +124 -0
trainer_log.jsonl
ADDED
@@ -0,0 +1,124 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{"current_steps": 1, "total_steps": 123, "loss": 1.0549, "lr": 5e-06, "epoch": 0.024390243902439025, "percentage": 0.81, "elapsed_time": "0:00:09", "remaining_time": "0:19:45"}
|
2 |
+
{"current_steps": 2, "total_steps": 123, "loss": 1.1685, "lr": 1e-05, "epoch": 0.04878048780487805, "percentage": 1.63, "elapsed_time": "0:00:16", "remaining_time": "0:16:11"}
|
3 |
+
{"current_steps": 3, "total_steps": 123, "loss": 1.0412, "lr": 1.5000000000000002e-05, "epoch": 0.07317073170731707, "percentage": 2.44, "elapsed_time": "0:00:22", "remaining_time": "0:15:10"}
|
4 |
+
{"current_steps": 4, "total_steps": 123, "loss": 0.9748, "lr": 2e-05, "epoch": 0.0975609756097561, "percentage": 3.25, "elapsed_time": "0:00:29", "remaining_time": "0:14:29"}
|
5 |
+
{"current_steps": 5, "total_steps": 123, "loss": 0.8506, "lr": 1.9996515418688493e-05, "epoch": 0.12195121951219512, "percentage": 4.07, "elapsed_time": "0:00:36", "remaining_time": "0:14:11"}
|
6 |
+
{"current_steps": 6, "total_steps": 123, "loss": 0.9128, "lr": 1.998606410321534e-05, "epoch": 0.14634146341463414, "percentage": 4.88, "elapsed_time": "0:00:44", "remaining_time": "0:14:25"}
|
7 |
+
{"current_steps": 7, "total_steps": 123, "loss": 0.9204, "lr": 1.9968653337272262e-05, "epoch": 0.17073170731707318, "percentage": 5.69, "elapsed_time": "0:00:50", "remaining_time": "0:14:01"}
|
8 |
+
{"current_steps": 8, "total_steps": 123, "loss": 0.9038, "lr": 1.9944295254705187e-05, "epoch": 0.1951219512195122, "percentage": 6.5, "elapsed_time": "0:00:57", "remaining_time": "0:13:41"}
|
9 |
+
{"current_steps": 9, "total_steps": 123, "loss": 0.9088, "lr": 1.9913006831057967e-05, "epoch": 0.21951219512195122, "percentage": 7.32, "elapsed_time": "0:01:05", "remaining_time": "0:13:46"}
|
10 |
+
{"current_steps": 10, "total_steps": 123, "loss": 0.8595, "lr": 1.9874809871741877e-05, "epoch": 0.24390243902439024, "percentage": 8.13, "elapsed_time": "0:01:12", "remaining_time": "0:13:38"}
|
11 |
+
{"current_steps": 11, "total_steps": 123, "loss": 0.9451, "lr": 1.982973099683902e-05, "epoch": 0.2682926829268293, "percentage": 8.94, "elapsed_time": "0:01:20", "remaining_time": "0:13:34"}
|
12 |
+
{"current_steps": 12, "total_steps": 123, "loss": 0.8742, "lr": 1.977780162255041e-05, "epoch": 0.2926829268292683, "percentage": 9.76, "elapsed_time": "0:01:27", "remaining_time": "0:13:30"}
|
13 |
+
{"current_steps": 13, "total_steps": 123, "loss": 0.8587, "lr": 1.9719057939301477e-05, "epoch": 0.3170731707317073, "percentage": 10.57, "elapsed_time": "0:01:33", "remaining_time": "0:13:15"}
|
14 |
+
{"current_steps": 14, "total_steps": 123, "loss": 0.8857, "lr": 1.9653540886520387e-05, "epoch": 0.34146341463414637, "percentage": 11.38, "elapsed_time": "0:01:41", "remaining_time": "0:13:09"}
|
15 |
+
{"current_steps": 15, "total_steps": 123, "loss": 0.8348, "lr": 1.9581296124106682e-05, "epoch": 0.36585365853658536, "percentage": 12.2, "elapsed_time": "0:01:49", "remaining_time": "0:13:05"}
|
16 |
+
{"current_steps": 16, "total_steps": 123, "loss": 0.7771, "lr": 1.9502374000610152e-05, "epoch": 0.3902439024390244, "percentage": 13.01, "elapsed_time": "0:01:55", "remaining_time": "0:12:55"}
|
17 |
+
{"current_steps": 17, "total_steps": 123, "loss": 0.8669, "lr": 1.941682951814212e-05, "epoch": 0.4146341463414634, "percentage": 13.82, "elapsed_time": "0:02:02", "remaining_time": "0:12:46"}
|
18 |
+
{"current_steps": 18, "total_steps": 123, "loss": 0.8422, "lr": 1.932472229404356e-05, "epoch": 0.43902439024390244, "percentage": 14.63, "elapsed_time": "0:02:09", "remaining_time": "0:12:35"}
|
19 |
+
{"current_steps": 19, "total_steps": 123, "loss": 0.8974, "lr": 1.922611651933683e-05, "epoch": 0.4634146341463415, "percentage": 15.45, "elapsed_time": "0:02:16", "remaining_time": "0:12:27"}
|
20 |
+
{"current_steps": 20, "total_steps": 123, "loss": 0.8578, "lr": 1.912108091398988e-05, "epoch": 0.4878048780487805, "percentage": 16.26, "elapsed_time": "0:02:23", "remaining_time": "0:12:19"}
|
21 |
+
{"current_steps": 21, "total_steps": 123, "loss": 0.9079, "lr": 1.900968867902419e-05, "epoch": 0.5121951219512195, "percentage": 17.07, "elapsed_time": "0:02:31", "remaining_time": "0:12:13"}
|
22 |
+
{"current_steps": 22, "total_steps": 123, "loss": 0.8396, "lr": 1.8892017445499812e-05, "epoch": 0.5365853658536586, "percentage": 17.89, "elapsed_time": "0:02:39", "remaining_time": "0:12:10"}
|
23 |
+
{"current_steps": 23, "total_steps": 123, "loss": 0.8946, "lr": 1.876814922041299e-05, "epoch": 0.5609756097560976, "percentage": 18.7, "elapsed_time": "0:02:46", "remaining_time": "0:12:05"}
|
24 |
+
{"current_steps": 24, "total_steps": 123, "loss": 0.8624, "lr": 1.8638170329544164e-05, "epoch": 0.5853658536585366, "percentage": 19.51, "elapsed_time": "0:02:53", "remaining_time": "0:11:55"}
|
25 |
+
{"current_steps": 25, "total_steps": 123, "loss": 0.9318, "lr": 1.8502171357296144e-05, "epoch": 0.6097560975609756, "percentage": 20.33, "elapsed_time": "0:03:00", "remaining_time": "0:11:46"}
|
26 |
+
{"current_steps": 26, "total_steps": 123, "loss": 0.9336, "lr": 1.8360247083564343e-05, "epoch": 0.6341463414634146, "percentage": 21.14, "elapsed_time": "0:03:06", "remaining_time": "0:11:36"}
|
27 |
+
{"current_steps": 27, "total_steps": 123, "loss": 0.9187, "lr": 1.8212496417683135e-05, "epoch": 0.6585365853658537, "percentage": 21.95, "elapsed_time": "0:03:13", "remaining_time": "0:11:27"}
|
28 |
+
{"current_steps": 28, "total_steps": 123, "loss": 0.8898, "lr": 1.805902232949435e-05, "epoch": 0.6829268292682927, "percentage": 22.76, "elapsed_time": "0:03:20", "remaining_time": "0:11:19"}
|
29 |
+
{"current_steps": 29, "total_steps": 123, "loss": 0.9139, "lr": 1.789993177758588e-05, "epoch": 0.7073170731707317, "percentage": 23.58, "elapsed_time": "0:03:27", "remaining_time": "0:11:13"}
|
30 |
+
{"current_steps": 30, "total_steps": 123, "loss": 0.8763, "lr": 1.773533563475053e-05, "epoch": 0.7317073170731707, "percentage": 24.39, "elapsed_time": "0:03:34", "remaining_time": "0:11:04"}
|
31 |
+
{"current_steps": 31, "total_steps": 123, "loss": 0.8888, "lr": 1.7565348610716963e-05, "epoch": 0.7560975609756098, "percentage": 25.2, "elapsed_time": "0:03:41", "remaining_time": "0:10:56"}
|
32 |
+
{"current_steps": 32, "total_steps": 123, "loss": 0.8847, "lr": 1.7390089172206594e-05, "epoch": 0.7804878048780488, "percentage": 26.02, "elapsed_time": "0:03:48", "remaining_time": "0:10:49"}
|
33 |
+
{"current_steps": 33, "total_steps": 123, "loss": 0.8353, "lr": 1.720967946037225e-05, "epoch": 0.8048780487804879, "percentage": 26.83, "elapsed_time": "0:03:56", "remaining_time": "0:10:43"}
|
34 |
+
{"current_steps": 34, "total_steps": 123, "loss": 0.8654, "lr": 1.7024245205675986e-05, "epoch": 0.8292682926829268, "percentage": 27.64, "elapsed_time": "0:04:03", "remaining_time": "0:10:36"}
|
35 |
+
{"current_steps": 35, "total_steps": 123, "loss": 0.8966, "lr": 1.6833915640265485e-05, "epoch": 0.8536585365853658, "percentage": 28.46, "elapsed_time": "0:04:10", "remaining_time": "0:10:31"}
|
36 |
+
{"current_steps": 36, "total_steps": 123, "loss": 0.8416, "lr": 1.6638823407910085e-05, "epoch": 0.8780487804878049, "percentage": 29.27, "elapsed_time": "0:04:18", "remaining_time": "0:10:24"}
|
37 |
+
{"current_steps": 37, "total_steps": 123, "loss": 0.82, "lr": 1.6439104471559157e-05, "epoch": 0.9024390243902439, "percentage": 30.08, "elapsed_time": "0:04:25", "remaining_time": "0:10:16"}
|
38 |
+
{"current_steps": 38, "total_steps": 123, "loss": 0.8381, "lr": 1.6234898018587336e-05, "epoch": 0.926829268292683, "percentage": 30.89, "elapsed_time": "0:04:33", "remaining_time": "0:10:10"}
|
39 |
+
{"current_steps": 39, "total_steps": 123, "loss": 0.8611, "lr": 1.6026346363792565e-05, "epoch": 0.9512195121951219, "percentage": 31.71, "elapsed_time": "0:04:39", "remaining_time": "0:10:02"}
|
40 |
+
{"current_steps": 40, "total_steps": 123, "loss": 0.8481, "lr": 1.58135948502146e-05, "epoch": 0.975609756097561, "percentage": 32.52, "elapsed_time": "0:04:46", "remaining_time": "0:09:53"}
|
41 |
+
{"current_steps": 41, "total_steps": 123, "loss": 0.7623, "lr": 1.5596791747843083e-05, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:04:52", "remaining_time": "0:09:45"}
|
42 |
+
{"current_steps": 42, "total_steps": 123, "loss": 0.5314, "lr": 1.5376088150285777e-05, "epoch": 1.024390243902439, "percentage": 34.15, "elapsed_time": "0:04:59", "remaining_time": "0:09:36"}
|
43 |
+
{"current_steps": 43, "total_steps": 123, "loss": 0.5289, "lr": 1.515163786946896e-05, "epoch": 1.048780487804878, "percentage": 34.96, "elapsed_time": "0:05:06", "remaining_time": "0:09:30"}
|
44 |
+
{"current_steps": 44, "total_steps": 123, "loss": 0.4823, "lr": 1.4923597328443423e-05, "epoch": 1.0731707317073171, "percentage": 35.77, "elapsed_time": "0:05:14", "remaining_time": "0:09:23"}
|
45 |
+
{"current_steps": 45, "total_steps": 123, "loss": 0.452, "lr": 1.4692125452370664e-05, "epoch": 1.0975609756097562, "percentage": 36.59, "elapsed_time": "0:05:21", "remaining_time": "0:09:17"}
|
46 |
+
{"current_steps": 46, "total_steps": 123, "loss": 0.4766, "lr": 1.4457383557765385e-05, "epoch": 1.1219512195121952, "percentage": 37.4, "elapsed_time": "0:05:28", "remaining_time": "0:09:09"}
|
47 |
+
{"current_steps": 47, "total_steps": 123, "loss": 0.4987, "lr": 1.4219535240071378e-05, "epoch": 1.146341463414634, "percentage": 38.21, "elapsed_time": "0:05:35", "remaining_time": "0:09:01"}
|
48 |
+
{"current_steps": 48, "total_steps": 123, "loss": 0.4782, "lr": 1.397874625964921e-05, "epoch": 1.170731707317073, "percentage": 39.02, "elapsed_time": "0:05:42", "remaining_time": "0:08:54"}
|
49 |
+
{"current_steps": 49, "total_steps": 123, "loss": 0.4167, "lr": 1.3735184426255117e-05, "epoch": 1.1951219512195121, "percentage": 39.84, "elapsed_time": "0:05:48", "remaining_time": "0:08:47"}
|
50 |
+
{"current_steps": 50, "total_steps": 123, "loss": 0.4421, "lr": 1.348901948209167e-05, "epoch": 1.2195121951219512, "percentage": 40.65, "elapsed_time": "0:05:56", "remaining_time": "0:08:40"}
|
51 |
+
{"current_steps": 51, "total_steps": 123, "loss": 0.4809, "lr": 1.324042298351166e-05, "epoch": 1.2439024390243902, "percentage": 41.46, "elapsed_time": "0:06:03", "remaining_time": "0:08:32"}
|
52 |
+
{"current_steps": 52, "total_steps": 123, "loss": 0.4607, "lr": 1.2989568181457704e-05, "epoch": 1.2682926829268293, "percentage": 42.28, "elapsed_time": "0:06:10", "remaining_time": "0:08:25"}
|
53 |
+
{"current_steps": 53, "total_steps": 123, "loss": 0.4786, "lr": 1.2736629900720832e-05, "epoch": 1.2926829268292683, "percentage": 43.09, "elapsed_time": "0:06:17", "remaining_time": "0:08:18"}
|
54 |
+
{"current_steps": 54, "total_steps": 123, "loss": 0.4772, "lr": 1.248178441810224e-05, "epoch": 1.3170731707317074, "percentage": 43.9, "elapsed_time": "0:06:23", "remaining_time": "0:08:10"}
|
55 |
+
{"current_steps": 55, "total_steps": 123, "loss": 0.4517, "lr": 1.2225209339563144e-05, "epoch": 1.3414634146341464, "percentage": 44.72, "elapsed_time": "0:06:31", "remaining_time": "0:08:04"}
|
56 |
+
{"current_steps": 56, "total_steps": 123, "loss": 0.3793, "lr": 1.1967083476448282e-05, "epoch": 1.3658536585365852, "percentage": 45.53, "elapsed_time": "0:06:39", "remaining_time": "0:07:58"}
|
57 |
+
{"current_steps": 57, "total_steps": 123, "loss": 0.4718, "lr": 1.1707586720869375e-05, "epoch": 1.3902439024390243, "percentage": 46.34, "elapsed_time": "0:06:47", "remaining_time": "0:07:51"}
|
58 |
+
{"current_steps": 58, "total_steps": 123, "loss": 0.4719, "lr": 1.1446899920335407e-05, "epoch": 1.4146341463414633, "percentage": 47.15, "elapsed_time": "0:06:53", "remaining_time": "0:07:43"}
|
59 |
+
{"current_steps": 59, "total_steps": 123, "loss": 0.4873, "lr": 1.118520475171703e-05, "epoch": 1.4390243902439024, "percentage": 47.97, "elapsed_time": "0:07:00", "remaining_time": "0:07:36"}
|
60 |
+
{"current_steps": 60, "total_steps": 123, "loss": 0.4539, "lr": 1.092268359463302e-05, "epoch": 1.4634146341463414, "percentage": 48.78, "elapsed_time": "0:07:08", "remaining_time": "0:07:29"}
|
61 |
+
{"current_steps": 61, "total_steps": 123, "loss": 0.4164, "lr": 1.0659519404346955e-05, "epoch": 1.4878048780487805, "percentage": 49.59, "elapsed_time": "0:07:15", "remaining_time": "0:07:22"}
|
62 |
+
{"current_steps": 62, "total_steps": 123, "loss": 0.466, "lr": 1.0395895584262696e-05, "epoch": 1.5121951219512195, "percentage": 50.41, "elapsed_time": "0:07:21", "remaining_time": "0:07:14"}
|
63 |
+
{"current_steps": 63, "total_steps": 123, "loss": 0.4534, "lr": 1.013199585810759e-05, "epoch": 1.5365853658536586, "percentage": 51.22, "elapsed_time": "0:07:29", "remaining_time": "0:07:08"}
|
64 |
+
{"current_steps": 64, "total_steps": 123, "loss": 0.4427, "lr": 9.868004141892412e-06, "epoch": 1.5609756097560976, "percentage": 52.03, "elapsed_time": "0:07:37", "remaining_time": "0:07:01"}
|
65 |
+
{"current_steps": 65, "total_steps": 123, "loss": 0.511, "lr": 9.604104415737309e-06, "epoch": 1.5853658536585367, "percentage": 52.85, "elapsed_time": "0:07:44", "remaining_time": "0:06:54"}
|
66 |
+
{"current_steps": 66, "total_steps": 123, "loss": 0.4375, "lr": 9.340480595653047e-06, "epoch": 1.6097560975609757, "percentage": 53.66, "elapsed_time": "0:07:50", "remaining_time": "0:06:46"}
|
67 |
+
{"current_steps": 67, "total_steps": 123, "loss": 0.4279, "lr": 9.07731640536698e-06, "epoch": 1.6341463414634148, "percentage": 54.47, "elapsed_time": "0:07:57", "remaining_time": "0:06:38"}
|
68 |
+
{"current_steps": 68, "total_steps": 123, "loss": 0.3974, "lr": 8.814795248282974e-06, "epoch": 1.6585365853658538, "percentage": 55.28, "elapsed_time": "0:08:04", "remaining_time": "0:06:31"}
|
69 |
+
{"current_steps": 69, "total_steps": 123, "loss": 0.4052, "lr": 8.553100079664598e-06, "epoch": 1.6829268292682928, "percentage": 56.1, "elapsed_time": "0:08:10", "remaining_time": "0:06:23"}
|
70 |
+
{"current_steps": 70, "total_steps": 123, "loss": 0.4258, "lr": 8.292413279130625e-06, "epoch": 1.7073170731707317, "percentage": 56.91, "elapsed_time": "0:08:18", "remaining_time": "0:06:17"}
|
71 |
+
{"current_steps": 71, "total_steps": 123, "loss": 0.5169, "lr": 8.03291652355172e-06, "epoch": 1.7317073170731707, "percentage": 57.72, "elapsed_time": "0:08:24", "remaining_time": "0:06:09"}
|
72 |
+
{"current_steps": 72, "total_steps": 123, "loss": 0.4179, "lr": 7.774790660436857e-06, "epoch": 1.7560975609756098, "percentage": 58.54, "elapsed_time": "0:08:30", "remaining_time": "0:06:01"}
|
73 |
+
{"current_steps": 73, "total_steps": 123, "loss": 0.465, "lr": 7.518215581897763e-06, "epoch": 1.7804878048780488, "percentage": 59.35, "elapsed_time": "0:08:37", "remaining_time": "0:05:54"}
|
74 |
+
{"current_steps": 74, "total_steps": 123, "loss": 0.4406, "lr": 7.263370099279173e-06, "epoch": 1.8048780487804879, "percentage": 60.16, "elapsed_time": "0:08:46", "remaining_time": "0:05:48"}
|
75 |
+
{"current_steps": 75, "total_steps": 123, "loss": 0.402, "lr": 7.010431818542298e-06, "epoch": 1.8292682926829267, "percentage": 60.98, "elapsed_time": "0:08:53", "remaining_time": "0:05:41"}
|
76 |
+
{"current_steps": 76, "total_steps": 123, "loss": 0.4467, "lr": 6.759577016488343e-06, "epoch": 1.8536585365853657, "percentage": 61.79, "elapsed_time": "0:09:00", "remaining_time": "0:05:34"}
|
77 |
+
{"current_steps": 77, "total_steps": 123, "loss": 0.441, "lr": 6.510980517908334e-06, "epoch": 1.8780487804878048, "percentage": 62.6, "elapsed_time": "0:09:07", "remaining_time": "0:05:26"}
|
78 |
+
{"current_steps": 78, "total_steps": 123, "loss": 0.443, "lr": 6.264815573744884e-06, "epoch": 1.9024390243902438, "percentage": 63.41, "elapsed_time": "0:09:14", "remaining_time": "0:05:19"}
|
79 |
+
{"current_steps": 79, "total_steps": 123, "loss": 0.4501, "lr": 6.021253740350793e-06, "epoch": 1.9268292682926829, "percentage": 64.23, "elapsed_time": "0:09:20", "remaining_time": "0:05:12"}
|
80 |
+
{"current_steps": 80, "total_steps": 123, "loss": 0.4567, "lr": 5.780464759928623e-06, "epoch": 1.951219512195122, "percentage": 65.04, "elapsed_time": "0:09:27", "remaining_time": "0:05:05"}
|
81 |
+
{"current_steps": 81, "total_steps": 123, "loss": 0.478, "lr": 5.542616442234618e-06, "epoch": 1.975609756097561, "percentage": 65.85, "elapsed_time": "0:09:34", "remaining_time": "0:04:57"}
|
82 |
+
{"current_steps": 82, "total_steps": 123, "loss": 0.3885, "lr": 5.307874547629339e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:09:42", "remaining_time": "0:04:51"}
|
83 |
+
{"current_steps": 83, "total_steps": 123, "loss": 0.2847, "lr": 5.076402671556578e-06, "epoch": 2.024390243902439, "percentage": 67.48, "elapsed_time": "0:09:48", "remaining_time": "0:04:43"}
|
84 |
+
{"current_steps": 84, "total_steps": 123, "loss": 0.2241, "lr": 4.848362130531039e-06, "epoch": 2.048780487804878, "percentage": 68.29, "elapsed_time": "0:09:56", "remaining_time": "0:04:36"}
|
85 |
+
{"current_steps": 85, "total_steps": 123, "loss": 0.2681, "lr": 4.623911849714226e-06, "epoch": 2.073170731707317, "percentage": 69.11, "elapsed_time": "0:10:03", "remaining_time": "0:04:29"}
|
86 |
+
{"current_steps": 86, "total_steps": 123, "loss": 0.2467, "lr": 4.403208252156921e-06, "epoch": 2.097560975609756, "percentage": 69.92, "elapsed_time": "0:10:09", "remaining_time": "0:04:22"}
|
87 |
+
{"current_steps": 87, "total_steps": 123, "loss": 0.2331, "lr": 4.186405149785403e-06, "epoch": 2.1219512195121952, "percentage": 70.73, "elapsed_time": "0:10:16", "remaining_time": "0:04:15"}
|
88 |
+
{"current_steps": 88, "total_steps": 123, "loss": 0.2126, "lr": 3.973653636207437e-06, "epoch": 2.1463414634146343, "percentage": 71.54, "elapsed_time": "0:10:24", "remaining_time": "0:04:08"}
|
89 |
+
{"current_steps": 89, "total_steps": 123, "loss": 0.2171, "lr": 3.7651019814126656e-06, "epoch": 2.1707317073170733, "percentage": 72.36, "elapsed_time": "0:10:31", "remaining_time": "0:04:01"}
|
90 |
+
{"current_steps": 90, "total_steps": 123, "loss": 0.2234, "lr": 3.560895528440844e-06, "epoch": 2.1951219512195124, "percentage": 73.17, "elapsed_time": "0:10:39", "remaining_time": "0:03:54"}
|
91 |
+
{"current_steps": 91, "total_steps": 123, "loss": 0.2361, "lr": 3.361176592089919e-06, "epoch": 2.2195121951219514, "percentage": 73.98, "elapsed_time": "0:10:46", "remaining_time": "0:03:47"}
|
92 |
+
{"current_steps": 92, "total_steps": 123, "loss": 0.2066, "lr": 3.1660843597345137e-06, "epoch": 2.2439024390243905, "percentage": 74.8, "elapsed_time": "0:10:52", "remaining_time": "0:03:40"}
|
93 |
+
{"current_steps": 93, "total_steps": 123, "loss": 0.202, "lr": 2.975754794324015e-06, "epoch": 2.2682926829268295, "percentage": 75.61, "elapsed_time": "0:10:59", "remaining_time": "0:03:32"}
|
94 |
+
{"current_steps": 94, "total_steps": 123, "loss": 0.2301, "lr": 2.7903205396277546e-06, "epoch": 2.292682926829268, "percentage": 76.42, "elapsed_time": "0:11:06", "remaining_time": "0:03:25"}
|
95 |
+
{"current_steps": 95, "total_steps": 123, "loss": 0.2267, "lr": 2.6099108277934105e-06, "epoch": 2.317073170731707, "percentage": 77.24, "elapsed_time": "0:11:13", "remaining_time": "0:03:18"}
|
96 |
+
{"current_steps": 96, "total_steps": 123, "loss": 0.2073, "lr": 2.4346513892830427e-06, "epoch": 2.341463414634146, "percentage": 78.05, "elapsed_time": "0:11:20", "remaining_time": "0:03:11"}
|
97 |
+
{"current_steps": 97, "total_steps": 123, "loss": 0.1988, "lr": 2.2646643652494693e-06, "epoch": 2.3658536585365852, "percentage": 78.86, "elapsed_time": "0:11:27", "remaining_time": "0:03:04"}
|
98 |
+
{"current_steps": 98, "total_steps": 123, "loss": 0.2421, "lr": 2.100068222414121e-06, "epoch": 2.3902439024390243, "percentage": 79.67, "elapsed_time": "0:11:34", "remaining_time": "0:02:57"}
|
99 |
+
{"current_steps": 99, "total_steps": 123, "loss": 0.1964, "lr": 1.9409776705056514e-06, "epoch": 2.4146341463414633, "percentage": 80.49, "elapsed_time": "0:11:42", "remaining_time": "0:02:50"}
|
100 |
+
{"current_steps": 100, "total_steps": 123, "loss": 0.2024, "lr": 1.7875035823168641e-06, "epoch": 2.4390243902439024, "percentage": 81.3, "elapsed_time": "0:11:49", "remaining_time": "0:02:43"}
|
101 |
+
{"current_steps": 101, "total_steps": 123, "loss": 0.2042, "lr": 1.6397529164356606e-06, "epoch": 2.4634146341463414, "percentage": 82.11, "elapsed_time": "0:11:56", "remaining_time": "0:02:36"}
|
102 |
+
{"current_steps": 102, "total_steps": 123, "loss": 0.2048, "lr": 1.4978286427038602e-06, "epoch": 2.4878048780487805, "percentage": 82.93, "elapsed_time": "0:12:02", "remaining_time": "0:02:28"}
|
103 |
+
{"current_steps": 103, "total_steps": 123, "loss": 0.1898, "lr": 1.3618296704558364e-06, "epoch": 2.5121951219512195, "percentage": 83.74, "elapsed_time": "0:12:11", "remaining_time": "0:02:21"}
|
104 |
+
{"current_steps": 104, "total_steps": 123, "loss": 0.2347, "lr": 1.2318507795870138e-06, "epoch": 2.5365853658536586, "percentage": 84.55, "elapsed_time": "0:12:18", "remaining_time": "0:02:14"}
|
105 |
+
{"current_steps": 105, "total_steps": 123, "loss": 0.2189, "lr": 1.1079825545001887e-06, "epoch": 2.5609756097560976, "percentage": 85.37, "elapsed_time": "0:12:24", "remaining_time": "0:02:07"}
|
106 |
+
{"current_steps": 106, "total_steps": 123, "loss": 0.2008, "lr": 9.903113209758098e-07, "epoch": 2.5853658536585367, "percentage": 86.18, "elapsed_time": "0:12:31", "remaining_time": "0:02:00"}
|
107 |
+
{"current_steps": 107, "total_steps": 123, "loss": 0.2044, "lr": 8.789190860101226e-07, "epoch": 2.6097560975609757, "percentage": 86.99, "elapsed_time": "0:12:38", "remaining_time": "0:01:53"}
|
108 |
+
{"current_steps": 108, "total_steps": 123, "loss": 0.1971, "lr": 7.738834806631712e-07, "epoch": 2.6341463414634148, "percentage": 87.8, "elapsed_time": "0:12:46", "remaining_time": "0:01:46"}
|
109 |
+
{"current_steps": 109, "total_steps": 123, "loss": 0.2154, "lr": 6.752777059564431e-07, "epoch": 2.658536585365854, "percentage": 88.62, "elapsed_time": "0:12:52", "remaining_time": "0:01:39"}
|
110 |
+
{"current_steps": 110, "total_steps": 123, "loss": 0.2208, "lr": 5.831704818578842e-07, "epoch": 2.682926829268293, "percentage": 89.43, "elapsed_time": "0:12:59", "remaining_time": "0:01:32"}
|
111 |
+
{"current_steps": 111, "total_steps": 123, "loss": 0.1765, "lr": 4.976259993898503e-07, "epoch": 2.7073170731707314, "percentage": 90.24, "elapsed_time": "0:13:05", "remaining_time": "0:01:24"}
|
112 |
+
{"current_steps": 112, "total_steps": 123, "loss": 0.208, "lr": 4.187038758933204e-07, "epoch": 2.7317073170731705, "percentage": 91.06, "elapsed_time": "0:13:11", "remaining_time": "0:01:17"}
|
113 |
+
{"current_steps": 113, "total_steps": 123, "loss": 0.2152, "lr": 3.4645911347961357e-07, "epoch": 2.7560975609756095, "percentage": 91.87, "elapsed_time": "0:13:18", "remaining_time": "0:01:10"}
|
114 |
+
{"current_steps": 114, "total_steps": 123, "loss": 0.2054, "lr": 2.809420606985236e-07, "epoch": 2.7804878048780486, "percentage": 92.68, "elapsed_time": "0:13:26", "remaining_time": "0:01:03"}
|
115 |
+
{"current_steps": 115, "total_steps": 123, "loss": 0.2105, "lr": 2.2219837744959284e-07, "epoch": 2.8048780487804876, "percentage": 93.5, "elapsed_time": "0:13:32", "remaining_time": "0:00:56"}
|
116 |
+
{"current_steps": 116, "total_steps": 123, "loss": 0.1872, "lr": 1.7026900316098217e-07, "epoch": 2.8292682926829267, "percentage": 94.31, "elapsed_time": "0:13:38", "remaining_time": "0:00:49"}
|
117 |
+
{"current_steps": 117, "total_steps": 123, "loss": 0.1979, "lr": 1.2519012825812804e-07, "epoch": 2.8536585365853657, "percentage": 95.12, "elapsed_time": "0:13:45", "remaining_time": "0:00:42"}
|
118 |
+
{"current_steps": 118, "total_steps": 123, "loss": 0.1883, "lr": 8.699316894203225e-08, "epoch": 2.8780487804878048, "percentage": 95.93, "elapsed_time": "0:13:53", "remaining_time": "0:00:35"}
|
119 |
+
{"current_steps": 119, "total_steps": 123, "loss": 0.1978, "lr": 5.5704745294815624e-08, "epoch": 2.902439024390244, "percentage": 96.75, "elapsed_time": "0:14:01", "remaining_time": "0:00:28"}
|
120 |
+
{"current_steps": 120, "total_steps": 123, "loss": 0.2007, "lr": 3.134666272774034e-08, "epoch": 2.926829268292683, "percentage": 97.56, "elapsed_time": "0:14:08", "remaining_time": "0:00:21"}
|
121 |
+
{"current_steps": 121, "total_steps": 123, "loss": 0.1945, "lr": 1.3935896784663671e-08, "epoch": 2.951219512195122, "percentage": 98.37, "elapsed_time": "0:14:16", "remaining_time": "0:00:14"}
|
122 |
+
{"current_steps": 122, "total_steps": 123, "loss": 0.188, "lr": 3.4845813115114147e-09, "epoch": 2.975609756097561, "percentage": 99.19, "elapsed_time": "0:14:24", "remaining_time": "0:00:07"}
|
123 |
+
{"current_steps": 123, "total_steps": 123, "loss": 0.1623, "lr": 0.0, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:14:31", "remaining_time": "0:00:00"}
|
124 |
+
{"current_steps": 123, "total_steps": 123, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:15:27", "remaining_time": "0:00:00"}
|