Training in progress, step 2000

Browse files

Files changed (13) hide show

{checkpoint-1000 → checkpoint-2000}/config.json +0 -0
{checkpoint-1000 → checkpoint-2000}/optimizer.pt +1 -1
{checkpoint-1000 → checkpoint-2000}/pytorch_model.bin +1 -1
{checkpoint-1000 → checkpoint-2000}/rng_state.pth +1 -1
{checkpoint-1000 → checkpoint-2000}/scheduler.pt +1 -1
{checkpoint-1000 → checkpoint-2000}/special_tokens_map.json +0 -0
{checkpoint-1000 → checkpoint-2000}/tokenizer.json +0 -0
{checkpoint-1000 → checkpoint-2000}/tokenizer_config.json +0 -0
{checkpoint-1000 → checkpoint-2000}/trainer_state.json +211 -3
{checkpoint-1000 → checkpoint-2000}/training_args.bin +0 -0
{checkpoint-1000 → checkpoint-2000}/vocab.txt +0 -0
pytorch_model.bin +1 -1
runs/Jul23_00-54-01_c587bebf8fcc/events.out.tfevents.1690073651.c587bebf8fcc.2239.0 +2 -2

{checkpoint-1000 → checkpoint-2000}/config.json RENAMED Viewed

File without changes

{checkpoint-1000 → checkpoint-2000}/optimizer.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9d32e8828d1b1ae30530b7473d552ff9aa020e0b2f239c8b8134dfe979d15c0b
 size 267028677

 version https://git-lfs.github.com/spec/v1
+oid sha256:09552910dd7d5ed2eb865c6b30253726e3dcd7aed3588cc97c4702b013630f01
 size 267028677

{checkpoint-1000 → checkpoint-2000}/pytorch_model.bin RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c366631ade427ba5a8dc8df9ca9f8d8f41caf8fad5eb2ca4c35c6fc3113ee13f
 size 133523761

 version https://git-lfs.github.com/spec/v1
+oid sha256:294d34cfcdd9a17427a0a09cdf19e071c82e8ce59c34f4fe159d3c5118d1082d
 size 133523761

{checkpoint-1000 → checkpoint-2000}/rng_state.pth RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:46f76c8bed144eb0462eae7b352d4482d3ae98f3e4263329c2f739c21b5dd5ca
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:4f48f6150f5133b116ca71b75680965f3b45ab43582cfcc6566086e18896784f
 size 14575

{checkpoint-1000 → checkpoint-2000}/scheduler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:13828e1677406f24ffee2b52c5ac79b462a76afddafb014a11a21dd7429637dd
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:0ad0c62478b179935d131a5f36054eef5c951ef7612bbd788e7a63be9d94d8ef
 size 627

{checkpoint-1000 → checkpoint-2000}/special_tokens_map.json RENAMED Viewed

File without changes

{checkpoint-1000 → checkpoint-2000}/tokenizer.json RENAMED Viewed

File without changes

{checkpoint-1000 → checkpoint-2000}/tokenizer_config.json RENAMED Viewed

File without changes

{checkpoint-1000 → checkpoint-2000}/trainer_state.json RENAMED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 4.0,
-  "global_step": 1000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -220,11 +220,219 @@
       "eval_system_ram_total": 83.48074722290039,
       "eval_system_ram_used": 3.8976211547851562,
       "step": 1000
     }
   ],
   "max_steps": 2500,
   "num_train_epochs": 10,
-  "total_flos": 504019356005760.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 8.0,
+  "global_step": 2000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_system_ram_total": 83.48074722290039,
       "eval_system_ram_used": 3.8976211547851562,
       "step": 1000
+    },
+    {
+      "epoch": 4.5,
+      "learning_rate": 1.1008e-05,
+      "loss": 0.8512,
+      "step": 1125
+    },
+    {
+      "epoch": 4.5,
+      "eval_accuracy": 0.6915,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 25.830577850341797,
+      "eval_f1": 0.6913447845710189,
+      "eval_gpu_ram_allocated": 0.3996849060058594,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 28,
+      "eval_loss": 1.0628596544265747,
+      "eval_precision": 0.6944500140220231,
+      "eval_recall": 0.6915,
+      "eval_runtime": 1.5986,
+      "eval_samples_per_second": 1251.121,
+      "eval_steps_per_second": 39.41,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 4.0599517822265625,
+      "step": 1125
+    },
+    {
+      "epoch": 5.0,
+      "learning_rate": 1.0008e-05,
+      "loss": 0.8121,
+      "step": 1250
+    },
+    {
+      "epoch": 5.0,
+      "eval_accuracy": 0.691,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 25.830596923828125,
+      "eval_f1": 0.6838005278906992,
+      "eval_gpu_ram_allocated": 0.39963626861572266,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 31,
+      "eval_loss": 1.0575964450836182,
+      "eval_precision": 0.6905089592227732,
+      "eval_recall": 0.691,
+      "eval_runtime": 1.5391,
+      "eval_samples_per_second": 1299.447,
+      "eval_steps_per_second": 40.933,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 4.043186187744141,
+      "step": 1250
+    },
+    {
+      "epoch": 5.5,
+      "learning_rate": 9.008e-06,
+      "loss": 0.7733,
+      "step": 1375
+    },
+    {
+      "epoch": 5.5,
+      "eval_accuracy": 0.6805,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 25.83068084716797,
+      "eval_f1": 0.6773653982197514,
+      "eval_gpu_ram_allocated": 0.3996090888977051,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 28,
+      "eval_loss": 1.0597690343856812,
+      "eval_precision": 0.683800229871734,
+      "eval_recall": 0.6805,
+      "eval_runtime": 1.5511,
+      "eval_samples_per_second": 1289.373,
+      "eval_steps_per_second": 40.615,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 3.837909698486328,
+      "step": 1375
+    },
+    {
+      "epoch": 6.0,
+      "learning_rate": 8.008e-06,
+      "loss": 0.7431,
+      "step": 1500
+    },
+    {
+      "epoch": 6.0,
+      "eval_accuracy": 0.702,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 25.830699920654297,
+      "eval_f1": 0.6973584149072398,
+      "eval_gpu_ram_allocated": 0.39962053298950195,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 31,
+      "eval_loss": 1.0375711917877197,
+      "eval_precision": 0.6975777506719404,
+      "eval_recall": 0.702,
+      "eval_runtime": 1.5383,
+      "eval_samples_per_second": 1300.155,
+      "eval_steps_per_second": 40.955,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 3.8545989990234375,
+      "step": 1500
+    },
+    {
+      "epoch": 6.5,
+      "learning_rate": 7.0080000000000005e-06,
+      "loss": 0.7065,
+      "step": 1625
+    },
+    {
+      "epoch": 6.5,
+      "eval_accuracy": 0.6995,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 26.203968048095703,
+      "eval_f1": 0.6990180197515704,
+      "eval_gpu_ram_allocated": 0.39959049224853516,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 28,
+      "eval_loss": 1.0457407236099243,
+      "eval_precision": 0.701399008937391,
+      "eval_recall": 0.6995,
+      "eval_runtime": 1.5796,
+      "eval_samples_per_second": 1266.127,
+      "eval_steps_per_second": 39.883,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 4.033943176269531,
+      "step": 1625
+    },
+    {
+      "epoch": 7.0,
+      "learning_rate": 6.008000000000001e-06,
+      "loss": 0.671,
+      "step": 1750
+    },
+    {
+      "epoch": 7.0,
+      "eval_accuracy": 0.698,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 26.203968048095703,
+      "eval_f1": 0.6956310421863513,
+      "eval_gpu_ram_allocated": 0.39962339401245117,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 28,
+      "eval_loss": 1.039590835571289,
+      "eval_precision": 0.696566876815876,
+      "eval_recall": 0.698,
+      "eval_runtime": 1.5301,
+      "eval_samples_per_second": 1307.136,
+      "eval_steps_per_second": 41.175,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 4.038356781005859,
+      "step": 1750
+    },
+    {
+      "epoch": 7.5,
+      "learning_rate": 5.008000000000001e-06,
+      "loss": 0.6438,
+      "step": 1875
+    },
+    {
+      "epoch": 7.5,
+      "eval_accuracy": 0.6925,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 26.203964233398438,
+      "eval_f1": 0.6886960392924729,
+      "eval_gpu_ram_allocated": 0.3995976448059082,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 28,
+      "eval_loss": 1.0473765134811401,
+      "eval_precision": 0.6906747949914751,
+      "eval_recall": 0.6925,
+      "eval_runtime": 1.5569,
+      "eval_samples_per_second": 1284.611,
+      "eval_steps_per_second": 40.465,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 3.827362060546875,
+      "step": 1875
+    },
+    {
+      "epoch": 8.0,
+      "learning_rate": 4.008e-06,
+      "loss": 0.6326,
+      "step": 2000
+    },
+    {
+      "epoch": 8.0,
+      "eval_accuracy": 0.698,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 26.204063415527344,
+      "eval_f1": 0.6972467602684949,
+      "eval_gpu_ram_allocated": 0.39958906173706055,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 34,
+      "eval_loss": 1.03837251663208,
+      "eval_precision": 0.6982790583069545,
+      "eval_recall": 0.698,
+      "eval_runtime": 1.5106,
+      "eval_samples_per_second": 1323.952,
+      "eval_steps_per_second": 41.704,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 3.8401947021484375,
+      "step": 2000
     }
   ],
   "max_steps": 2500,
   "num_train_epochs": 10,
+  "total_flos": 1010109883418496.0,
   "trial_name": null,
   "trial_params": null
 }

{checkpoint-1000 → checkpoint-2000}/training_args.bin RENAMED Viewed

File without changes

{checkpoint-1000 → checkpoint-2000}/vocab.txt RENAMED Viewed

File without changes

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f999c13d7f0a2621e532de7860c6e7dc21666552e25f1fbe53bc03deab0da720
 size 133523761

 version https://git-lfs.github.com/spec/v1
+oid sha256:294d34cfcdd9a17427a0a09cdf19e071c82e8ce59c34f4fe159d3c5118d1082d
 size 133523761

runs/Jul23_00-54-01_c587bebf8fcc/events.out.tfevents.1690073651.c587bebf8fcc.2239.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ceb3666a0265e2a6fc0d5ffc3b2dd8c1c85a7f4686342050f7bcf179e6a213fd
-size 18081

 version https://git-lfs.github.com/spec/v1
+oid sha256:0a87e472813cf54d514cc70f3dcc6d715385ff7ad568595a73f287577b33a094
+size 22489