Model save

Files changed (5) hide show

all_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "epoch": 3.0,
-    "train_loss": 2.116673701227048,
-    "train_runtime": 309.01,
-    "train_samples": 30000,
-    "train_samples_per_second": 291.253,
-    "train_steps_per_second": 1.146
 }

 {
     "epoch": 3.0,
+    "train_loss": 4.621011098225911,
+    "train_runtime": 40.2046,
+    "train_samples": 3000,
+    "train_samples_per_second": 223.855,
+    "train_steps_per_second": 0.895
 }

args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:84681b490574eec665dd628028717bdc85fbdb7ad3d54c8ed025f6816f1b69f3
 size 5652

 version https://git-lfs.github.com/spec/v1
+oid sha256:d40abfa4155cddcba82cbf65e16136b1f7f02f9059737d9f4180121e5bafbba5
 size 5652

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "epoch": 3.0,
-    "train_loss": 2.116673701227048,
-    "train_runtime": 309.01,
-    "train_samples": 30000,
-    "train_samples_per_second": 291.253,
-    "train_steps_per_second": 1.146
 }

 {
     "epoch": 3.0,
+    "train_loss": 4.621011098225911,
+    "train_runtime": 40.2046,
+    "train_samples": 3000,
+    "train_samples_per_second": 223.855,
+    "train_steps_per_second": 0.895
 }

trainer_state.json CHANGED Viewed

@@ -3,26 +3,26 @@
   "best_model_checkpoint": null,
   "epoch": 3.0,
   "eval_steps": 500,
-  "global_step": 354,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
       "epoch": 3.0,
-      "step": 354,
-      "total_flos": 8819084252160000.0,
-      "train_loss": 2.116673701227048,
-      "train_runtime": 309.01,
-      "train_samples_per_second": 291.253,
-      "train_steps_per_second": 1.146
     }
   ],
   "logging_steps": 500,
-  "max_steps": 354,
   "num_train_epochs": 3,
   "save_steps": 500,
-  "total_flos": 8819084252160000.0,
   "trial_name": null,
   "trial_params": null
 }

   "best_model_checkpoint": null,
   "epoch": 3.0,
   "eval_steps": 500,
+  "global_step": 36,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
   "log_history": [
     {
       "epoch": 3.0,
+      "step": 36,
+      "total_flos": 881908425216000.0,
+      "train_loss": 4.621011098225911,
+      "train_runtime": 40.2046,
+      "train_samples_per_second": 223.855,
+      "train_steps_per_second": 0.895
     }
   ],
   "logging_steps": 500,
+  "max_steps": 36,
   "num_train_epochs": 3,
   "save_steps": 500,
+  "total_flos": 881908425216000.0,
   "trial_name": null,
   "trial_params": null
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ed62376ecc90c8a01bbc2f29b3d92d6ab6a87975e9b65b07bf2310214f6493ce
 size 4664

 version https://git-lfs.github.com/spec/v1
+oid sha256:4c21a7a1d71fbc7505829b21472df420af8d762d2ec82196f32ef3365d115b7e
 size 4664