Training in progress, step 250000

Browse files

Files changed (8) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +2 -2
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +77 -3
last-checkpoint/training_args.bin +1 -1
pytorch_model.bin +1 -1
training_args.bin +1 -1

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:11144856c02c8e972a36fb5b42d4223035071c4a917ea79c06d582d2b9be6085
 size 893441530

 version https://git-lfs.github.com/spec/v1
+oid sha256:ce3e998a193326c567e5bf36b4614bcf9a92a873dabc8d985ee1ad116cb61ad2
 size 893441530

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1ad81878847ff45e1880bc9e193537b6a982e87fb64a13bbf06eba84c2c3ee6f
 size 454197066

 version https://git-lfs.github.com/spec/v1
+oid sha256:36acb3092fbd4cafad2bc39be38c35f4299b28e4d00c2f26079a5a4d3580780f
 size 454197066

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:20be28e08eeb080e0d87de2c1d006e31a433ae3d529b46a69dfe770492fd995c
-size 14180

 version https://git-lfs.github.com/spec/v1
+oid sha256:58f82edd7a6194c8353e8edba667f026c5f098b23c6a725d52469afb859bd8fc
+size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c781a803fdb01dba917962146262a56eb080213a823923503263cf460fa3ac80
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:e57954a9914278616526cbeea30401601bc7a6e242a7a52a60b8796e825a3c98
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.24,
-  "global_step": 240000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1782,11 +1782,85 @@
       "eval_samples_per_second": 99.85,
       "eval_steps_per_second": 12.481,
       "step": 240000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 2.125106441575465e+21,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.25,
+  "global_step": 250000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 99.85,
       "eval_steps_per_second": 12.481,
       "step": 240000
+    },
+    {
+      "epoch": 0.24,
+      "learning_rate": 1.7905926017192613e-05,
+      "loss": 0.3632,
+      "step": 241000
+    },
+    {
+      "epoch": 0.24,
+      "learning_rate": 1.7897364070353612e-05,
+      "loss": 0.3633,
+      "step": 242000
+    },
+    {
+      "epoch": 0.24,
+      "learning_rate": 1.788876360350547e-05,
+      "loss": 0.3628,
+      "step": 243000
+    },
+    {
+      "epoch": 0.24,
+      "learning_rate": 1.7880124710701515e-05,
+      "loss": 0.3628,
+      "step": 244000
+    },
+    {
+      "epoch": 0.24,
+      "learning_rate": 1.7871447486415292e-05,
+      "loss": 0.363,
+      "step": 245000
+    },
+    {
+      "epoch": 0.24,
+      "eval_runtime": 3598.9717,
+      "eval_samples_per_second": 94.375,
+      "eval_steps_per_second": 11.797,
+      "step": 245000
+    },
+    {
+      "epoch": 0.25,
+      "learning_rate": 1.7862732025539543e-05,
+      "loss": 0.364,
+      "step": 246000
+    },
+    {
+      "epoch": 0.25,
+      "learning_rate": 1.7853978423385145e-05,
+      "loss": 0.3626,
+      "step": 247000
+    },
+    {
+      "epoch": 0.25,
+      "learning_rate": 1.784518677568009e-05,
+      "loss": 0.361,
+      "step": 248000
+    },
+    {
+      "epoch": 0.25,
+      "learning_rate": 1.783635717856843e-05,
+      "loss": 0.3597,
+      "step": 249000
+    },
+    {
+      "epoch": 0.25,
+      "learning_rate": 1.782748972860922e-05,
+      "loss": 0.3626,
+      "step": 250000
+    },
+    {
+      "epoch": 0.25,
+      "eval_runtime": 2943.8602,
+      "eval_samples_per_second": 115.376,
+      "eval_steps_per_second": 14.422,
+      "step": 250000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 2.213652543307776e+21,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b02dcd885a628a7855e3e0c6a6edcce3320ca6c2778748fda625b892498f6832
 size 3768

 version https://git-lfs.github.com/spec/v1
+oid sha256:04b59685dedbedfa441a393ef0561d0eeade03f2fa8b31fadfbec3e0393ee18f
 size 3768

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1ad81878847ff45e1880bc9e193537b6a982e87fb64a13bbf06eba84c2c3ee6f
 size 454197066

 version https://git-lfs.github.com/spec/v1
+oid sha256:36acb3092fbd4cafad2bc39be38c35f4299b28e4d00c2f26079a5a4d3580780f
 size 454197066

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b02dcd885a628a7855e3e0c6a6edcce3320ca6c2778748fda625b892498f6832
 size 3768

 version https://git-lfs.github.com/spec/v1
+oid sha256:04b59685dedbedfa441a393ef0561d0eeade03f2fa8b31fadfbec3e0393ee18f
 size 3768