Training in progress, step 1000, checkpoint

Files changed (5) hide show

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:73f9709676fd308493096edfefbab55e00200fd0ec9eee8d1c8d9c9b9393dd60
 size 1625426996

 version https://git-lfs.github.com/spec/v1
+oid sha256:2d2170685d0967d98d541384fb9096bbe76c996e2f2ef5d10553264ddc385c8a
 size 1625426996

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:13b3726efa7754053b08c4fa6b30b5a12364126ed953d7f0b1fcf11d22c76b26
 size 3250759951

 version https://git-lfs.github.com/spec/v1
+oid sha256:059e1efd93190766ac5721961dbf55ea0e558cb218646ccd52ba2f24b9c2e591
 size 3250759951

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3e7af7a01e94a9a7176c2bbdf2cb9b8139105cfe65528853ec5a27025100d6bc
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:571b846c9de4671606b4803fe209b7424419cce76e7d83b36c52a236294e4cb0
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e9eeeb5bdd24cb6de6ccdee8afd347d0c5c5a88be6c8e7e24752989eef5c1513
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:6dbaa1691f7b35bc2bd0f7fb06c6d3b2bc869f5776dc79a2f162736695a4d24b
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.2,
   "eval_steps": 500,
-  "global_step": 500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -13,13 +13,19 @@
       "learning_rate": 1.869158878504673e-05,
       "loss": 0.4912,
       "step": 500
     }
   ],
   "logging_steps": 500,
   "max_steps": 7500,
   "num_train_epochs": 3,
   "save_steps": 500,
-  "total_flos": 846525235200000.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.4,
   "eval_steps": 500,
+  "global_step": 1000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.869158878504673e-05,
       "loss": 0.4912,
       "step": 500
+    },
+    {
+      "epoch": 0.4,
+      "learning_rate": 1.7356475300400533e-05,
+      "loss": 0.3659,
+      "step": 1000
     }
   ],
   "logging_steps": 500,
   "max_steps": 7500,
   "num_train_epochs": 3,
   "save_steps": 500,
+  "total_flos": 1693050470400000.0,
   "trial_name": null,
   "trial_params": null
 }