sedrickkeh
commited on
Training in progress, step 438
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0bdcc5f6cb8a41cf11c8174f01dafe986594cf116f9626d5c07ab2601fce63ce
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f0c448599d3827728eb9b8940743d3acaed1398a19a58c0ac4342222b68ad7c
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0dc7b302d3dd8448833ccdf862bec05002338d7c15600c4d0fbd202000486268
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69cb676d884d33ff39e029e9098e1992480d2cc43f622f6591be3ab69a67d055
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -405,3 +405,35 @@
|
|
405 |
{"current_steps": 405, "total_steps": 438, "loss": 0.4562, "lr": 1.7209489588483396e-07, "epoch": 2.7739726027397262, "percentage": 92.47, "elapsed_time": "2:22:50", "remaining_time": "0:11:38"}
|
406 |
{"current_steps": 406, "total_steps": 438, "loss": 0.4405, "lr": 1.6187873328216142e-07, "epoch": 2.780821917808219, "percentage": 92.69, "elapsed_time": "2:23:10", "remaining_time": "0:11:17"}
|
407 |
{"current_steps": 407, "total_steps": 438, "loss": 0.4667, "lr": 1.519701674351265e-07, "epoch": 2.787671232876712, "percentage": 92.92, "elapsed_time": "2:23:31", "remaining_time": "0:10:55"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
405 |
{"current_steps": 405, "total_steps": 438, "loss": 0.4562, "lr": 1.7209489588483396e-07, "epoch": 2.7739726027397262, "percentage": 92.47, "elapsed_time": "2:22:50", "remaining_time": "0:11:38"}
|
406 |
{"current_steps": 406, "total_steps": 438, "loss": 0.4405, "lr": 1.6187873328216142e-07, "epoch": 2.780821917808219, "percentage": 92.69, "elapsed_time": "2:23:10", "remaining_time": "0:11:17"}
|
407 |
{"current_steps": 407, "total_steps": 438, "loss": 0.4667, "lr": 1.519701674351265e-07, "epoch": 2.787671232876712, "percentage": 92.92, "elapsed_time": "2:23:31", "remaining_time": "0:10:55"}
|
408 |
+
{"current_steps": 408, "total_steps": 438, "loss": 0.4426, "lr": 1.4236982830782676e-07, "epoch": 2.7945205479452055, "percentage": 93.15, "elapsed_time": "2:23:51", "remaining_time": "0:10:34"}
|
409 |
+
{"current_steps": 409, "total_steps": 438, "loss": 0.4664, "lr": 1.3307832626800966e-07, "epoch": 2.8013698630136985, "percentage": 93.38, "elapsed_time": "2:24:13", "remaining_time": "0:10:13"}
|
410 |
+
{"current_steps": 410, "total_steps": 438, "loss": 0.4149, "lr": 1.2409625204825802e-07, "epoch": 2.808219178082192, "percentage": 93.61, "elapsed_time": "2:24:34", "remaining_time": "0:09:52"}
|
411 |
+
{"current_steps": 411, "total_steps": 438, "loss": 0.4464, "lr": 1.1542417670844075e-07, "epoch": 2.815068493150685, "percentage": 93.84, "elapsed_time": "2:24:52", "remaining_time": "0:09:31"}
|
412 |
+
{"current_steps": 412, "total_steps": 438, "loss": 0.4472, "lr": 1.0706265159939944e-07, "epoch": 2.821917808219178, "percentage": 94.06, "elapsed_time": "2:25:12", "remaining_time": "0:09:09"}
|
413 |
+
{"current_steps": 413, "total_steps": 438, "loss": 0.4535, "lr": 9.901220832790104e-08, "epoch": 2.828767123287671, "percentage": 94.29, "elapsed_time": "2:25:33", "remaining_time": "0:08:48"}
|
414 |
+
{"current_steps": 414, "total_steps": 438, "loss": 0.4219, "lr": 9.12733587228326e-08, "epoch": 2.8356164383561646, "percentage": 94.52, "elapsed_time": "2:25:52", "remaining_time": "0:08:27"}
|
415 |
+
{"current_steps": 415, "total_steps": 438, "loss": 0.4549, "lr": 8.384659480266733e-08, "epoch": 2.8424657534246576, "percentage": 94.75, "elapsed_time": "2:26:14", "remaining_time": "0:08:06"}
|
416 |
+
{"current_steps": 416, "total_steps": 438, "loss": 0.4469, "lr": 7.673238874417676e-08, "epoch": 2.8493150684931505, "percentage": 94.98, "elapsed_time": "2:26:34", "remaining_time": "0:07:45"}
|
417 |
+
{"current_steps": 417, "total_steps": 438, "loss": 0.4427, "lr": 6.9931192852416e-08, "epoch": 2.856164383561644, "percentage": 95.21, "elapsed_time": "2:26:56", "remaining_time": "0:07:23"}
|
418 |
+
{"current_steps": 418, "total_steps": 438, "loss": 0.4769, "lr": 6.344343953196386e-08, "epoch": 2.863013698630137, "percentage": 95.43, "elapsed_time": "2:27:16", "remaining_time": "0:07:02"}
|
419 |
+
{"current_steps": 419, "total_steps": 438, "loss": 0.439, "lr": 5.726954125943318e-08, "epoch": 2.8698630136986303, "percentage": 95.66, "elapsed_time": "2:27:38", "remaining_time": "0:06:41"}
|
420 |
+
{"current_steps": 420, "total_steps": 438, "loss": 0.4169, "lr": 5.1409890557246876e-08, "epoch": 2.8767123287671232, "percentage": 95.89, "elapsed_time": "2:27:57", "remaining_time": "0:06:20"}
|
421 |
+
{"current_steps": 421, "total_steps": 438, "loss": 0.4413, "lr": 4.586485996867951e-08, "epoch": 2.883561643835616, "percentage": 96.12, "elapsed_time": "2:28:16", "remaining_time": "0:05:59"}
|
422 |
+
{"current_steps": 422, "total_steps": 438, "loss": 0.4463, "lr": 4.063480203417625e-08, "epoch": 2.8904109589041096, "percentage": 96.35, "elapsed_time": "2:28:35", "remaining_time": "0:05:38"}
|
423 |
+
{"current_steps": 423, "total_steps": 438, "loss": 0.4184, "lr": 3.572004926893413e-08, "epoch": 2.897260273972603, "percentage": 96.58, "elapsed_time": "2:28:57", "remaining_time": "0:05:16"}
|
424 |
+
{"current_steps": 424, "total_steps": 438, "loss": 0.4391, "lr": 3.1120914141766214e-08, "epoch": 2.904109589041096, "percentage": 96.8, "elapsed_time": "2:29:16", "remaining_time": "0:04:55"}
|
425 |
+
{"current_steps": 425, "total_steps": 438, "loss": 0.4579, "lr": 2.683768905523243e-08, "epoch": 2.910958904109589, "percentage": 97.03, "elapsed_time": "2:29:38", "remaining_time": "0:04:34"}
|
426 |
+
{"current_steps": 426, "total_steps": 438, "loss": 0.456, "lr": 2.287064632705005e-08, "epoch": 2.9178082191780823, "percentage": 97.26, "elapsed_time": "2:30:00", "remaining_time": "0:04:13"}
|
427 |
+
{"current_steps": 427, "total_steps": 438, "loss": 0.4306, "lr": 1.9220038172780843e-08, "epoch": 2.9246575342465753, "percentage": 97.49, "elapsed_time": "2:30:20", "remaining_time": "0:03:52"}
|
428 |
+
{"current_steps": 428, "total_steps": 438, "loss": 0.4539, "lr": 1.588609668979446e-08, "epoch": 2.9315068493150687, "percentage": 97.72, "elapsed_time": "2:30:41", "remaining_time": "0:03:31"}
|
429 |
+
{"current_steps": 429, "total_steps": 438, "loss": 0.4576, "lr": 1.286903384251581e-08, "epoch": 2.9383561643835616, "percentage": 97.95, "elapsed_time": "2:31:03", "remaining_time": "0:03:10"}
|
430 |
+
{"current_steps": 430, "total_steps": 438, "loss": 0.4464, "lr": 1.016904144894304e-08, "epoch": 2.9452054794520546, "percentage": 98.17, "elapsed_time": "2:31:23", "remaining_time": "0:02:49"}
|
431 |
+
{"current_steps": 431, "total_steps": 438, "loss": 0.471, "lr": 7.78629116845786e-09, "epoch": 2.952054794520548, "percentage": 98.4, "elapsed_time": "2:31:47", "remaining_time": "0:02:27"}
|
432 |
+
{"current_steps": 432, "total_steps": 438, "loss": 0.4357, "lr": 5.720934490907604e-09, "epoch": 2.958904109589041, "percentage": 98.63, "elapsed_time": "2:32:07", "remaining_time": "0:02:06"}
|
433 |
+
{"current_steps": 433, "total_steps": 438, "loss": 0.4451, "lr": 3.973102726976819e-09, "epoch": 2.9657534246575343, "percentage": 98.86, "elapsed_time": "2:32:29", "remaining_time": "0:01:45"}
|
434 |
+
{"current_steps": 434, "total_steps": 438, "loss": 0.4503, "lr": 2.542906999836725e-09, "epoch": 2.9726027397260273, "percentage": 99.09, "elapsed_time": "2:32:50", "remaining_time": "0:01:24"}
|
435 |
+
{"current_steps": 435, "total_steps": 438, "loss": 0.4465, "lr": 1.4304382380819771e-09, "epoch": 2.9794520547945207, "percentage": 99.32, "elapsed_time": "2:33:12", "remaining_time": "0:01:03"}
|
436 |
+
{"current_steps": 436, "total_steps": 438, "loss": 0.4726, "lr": 6.357671699486201e-10, "epoch": 2.9863013698630136, "percentage": 99.54, "elapsed_time": "2:33:34", "remaining_time": "0:00:42"}
|
437 |
+
{"current_steps": 437, "total_steps": 438, "loss": 0.4642, "lr": 1.5894431881657845e-10, "epoch": 2.993150684931507, "percentage": 99.77, "elapsed_time": "2:33:54", "remaining_time": "0:00:21"}
|
438 |
+
{"current_steps": 438, "total_steps": 438, "loss": 0.4255, "lr": 0.0, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2:34:13", "remaining_time": "0:00:00"}
|
439 |
+
{"current_steps": 438, "total_steps": 438, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2:35:05", "remaining_time": "0:00:00"}
|