Training in progress, epoch 1

Files changed (5) hide show

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:657be1bfded62b841a1e769ecd60f2c3027dfa2ad74369d3deec8017c37994cd
 size 4976698672

 version https://git-lfs.github.com/spec/v1
+oid sha256:87a9bebf99a12d846d8accd01a5e667b4678cd0795ef22a497d4250a8def8b78
 size 4976698672

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4438d7928ec9af04d96f0b2815b25dbcdd7404da01c9a8bde48f1a7305ed171a
 size 4999802720

 version https://git-lfs.github.com/spec/v1
+oid sha256:ed8fb818c662bf7f752cdc934bcaf217d8c97e42f49b0f51a4124601e3f84b33
 size 4999802720

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5cf74072a330f4b5081e0778816d1942e6790656a161767aa5edaad7dc09d1d2
 size 4915916176

 version https://git-lfs.github.com/spec/v1
+oid sha256:cff79f7bbd0831776168b8f177d580837f64668af3f3a96405204c889cf54269
 size 4915916176

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2663c8c77b188d9055dcaa070be145348ac85da8b5d506d37d3e1b559507d081
 size 1168138808

 version https://git-lfs.github.com/spec/v1
+oid sha256:6aa56d70608a7852cb0b8cbb49e9656ec9db92342a500b9f5a1d899fdcf6d2e4
 size 1168138808

trainer_log.jsonl CHANGED Viewed

@@ -1,3 +1,6 @@
 {"current_steps": 10, "total_steps": 60, "loss": 1.1263, "lr": 5e-06, "epoch": 0.48484848484848486, "percentage": 16.67, "elapsed_time": "0:09:38", "remaining_time": "0:48:13"}
 {"current_steps": 20, "total_steps": 60, "loss": 1.0663, "lr": 5e-06, "epoch": 0.9696969696969697, "percentage": 33.33, "elapsed_time": "0:19:12", "remaining_time": "0:38:24"}
 {"current_steps": 20, "total_steps": 60, "eval_loss": 1.1175479888916016, "epoch": 0.9696969696969697, "percentage": 33.33, "elapsed_time": "0:20:09", "remaining_time": "0:40:19"}

 {"current_steps": 10, "total_steps": 60, "loss": 1.1263, "lr": 5e-06, "epoch": 0.48484848484848486, "percentage": 16.67, "elapsed_time": "0:09:38", "remaining_time": "0:48:13"}
 {"current_steps": 20, "total_steps": 60, "loss": 1.0663, "lr": 5e-06, "epoch": 0.9696969696969697, "percentage": 33.33, "elapsed_time": "0:19:12", "remaining_time": "0:38:24"}
 {"current_steps": 20, "total_steps": 60, "eval_loss": 1.1175479888916016, "epoch": 0.9696969696969697, "percentage": 33.33, "elapsed_time": "0:20:09", "remaining_time": "0:40:19"}
+{"current_steps": 30, "total_steps": 60, "loss": 1.0693, "lr": 5e-06, "epoch": 1.4545454545454546, "percentage": 50.0, "elapsed_time": "0:30:20", "remaining_time": "0:30:20"}
+{"current_steps": 40, "total_steps": 60, "loss": 0.9594, "lr": 5e-06, "epoch": 1.9393939393939394, "percentage": 66.67, "elapsed_time": "0:39:54", "remaining_time": "0:19:57"}
+{"current_steps": 41, "total_steps": 60, "eval_loss": 0.9644138813018799, "epoch": 1.9878787878787878, "percentage": 68.33, "elapsed_time": "0:41:23", "remaining_time": "0:19:11"}