Training in progress, step 2500

Browse files

Files changed (13) hide show

{checkpoint-1500 → checkpoint-2500}/config.json +0 -0
{checkpoint-1500 → checkpoint-2500}/optimizer.pt +1 -1
{checkpoint-1500 → checkpoint-2500}/pytorch_model.bin +1 -1
{checkpoint-1500 → checkpoint-2500}/rng_state.pth +1 -1
{checkpoint-1500 → checkpoint-2500}/scheduler.pt +1 -1
{checkpoint-1500 → checkpoint-2500}/special_tokens_map.json +0 -0
{checkpoint-1500 → checkpoint-2500}/tokenizer.json +0 -0
{checkpoint-1500 → checkpoint-2500}/tokenizer_config.json +0 -0
{checkpoint-1500 → checkpoint-2500}/trainer_state.json +211 -3
{checkpoint-1500 → checkpoint-2500}/training_args.bin +0 -0
{checkpoint-1500 → checkpoint-2500}/vocab.txt +0 -0
pytorch_model.bin +1 -1
runs/Jul23_00-54-01_c587bebf8fcc/events.out.tfevents.1690073651.c587bebf8fcc.2239.0 +2 -2

{checkpoint-1500 → checkpoint-2500}/config.json RENAMED Viewed

File without changes

{checkpoint-1500 → checkpoint-2500}/optimizer.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ab1734c54c793eae65a52769f5766f6b16b6f36390c14dc1739b4234a106ff18
 size 267028677

 version https://git-lfs.github.com/spec/v1
+oid sha256:e27059fba75966ca72a03e9cc7b0567389190ed68f16253b9591168a0cb597cc
 size 267028677

{checkpoint-1500 → checkpoint-2500}/pytorch_model.bin RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f999c13d7f0a2621e532de7860c6e7dc21666552e25f1fbe53bc03deab0da720
 size 133523761

 version https://git-lfs.github.com/spec/v1
+oid sha256:a16a1346b21837ee13d52ba582c706fb96643d039a8ec745ade06a4e78deb60b
 size 133523761

{checkpoint-1500 → checkpoint-2500}/rng_state.pth RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:29a5152fbf9e36140a3cd5aa7c29061d9d557b4711f36df08bb03836ef9ea515
 size 14575

 version https://git-lfs.github.com/spec/v1
+oid sha256:aef4ff96e068791b9d58ae396a6507bbeb779c898b52e30a356343311eae07b5
 size 14575

{checkpoint-1500 → checkpoint-2500}/scheduler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6e32f545d6a13edab9664803abf0214c94c6788b08b3d1c916e39481a4cd4f0c
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:e243256e5ce9269604f12fd0aa4d7ccba676cc02c66217d98097b0986fa106b8
 size 627

{checkpoint-1500 → checkpoint-2500}/special_tokens_map.json RENAMED Viewed

File without changes

{checkpoint-1500 → checkpoint-2500}/tokenizer.json RENAMED Viewed

File without changes

{checkpoint-1500 → checkpoint-2500}/tokenizer_config.json RENAMED Viewed

File without changes

{checkpoint-1500 → checkpoint-2500}/trainer_state.json RENAMED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 6.0,
-  "global_step": 1500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -324,11 +324,219 @@
       "eval_system_ram_total": 83.48074722290039,
       "eval_system_ram_used": 3.8545989990234375,
       "step": 1500
     }
   ],
   "max_steps": 2500,
   "num_train_epochs": 10,
-  "total_flos": 756994619883264.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 10.0,
+  "global_step": 2500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_system_ram_total": 83.48074722290039,
       "eval_system_ram_used": 3.8545989990234375,
       "step": 1500
+    },
+    {
+      "epoch": 6.5,
+      "learning_rate": 7.0080000000000005e-06,
+      "loss": 0.7065,
+      "step": 1625
+    },
+    {
+      "epoch": 6.5,
+      "eval_accuracy": 0.6995,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 26.203968048095703,
+      "eval_f1": 0.6990180197515704,
+      "eval_gpu_ram_allocated": 0.39959049224853516,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 28,
+      "eval_loss": 1.0457407236099243,
+      "eval_precision": 0.701399008937391,
+      "eval_recall": 0.6995,
+      "eval_runtime": 1.5796,
+      "eval_samples_per_second": 1266.127,
+      "eval_steps_per_second": 39.883,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 4.033943176269531,
+      "step": 1625
+    },
+    {
+      "epoch": 7.0,
+      "learning_rate": 6.008000000000001e-06,
+      "loss": 0.671,
+      "step": 1750
+    },
+    {
+      "epoch": 7.0,
+      "eval_accuracy": 0.698,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 26.203968048095703,
+      "eval_f1": 0.6956310421863513,
+      "eval_gpu_ram_allocated": 0.39962339401245117,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 28,
+      "eval_loss": 1.039590835571289,
+      "eval_precision": 0.696566876815876,
+      "eval_recall": 0.698,
+      "eval_runtime": 1.5301,
+      "eval_samples_per_second": 1307.136,
+      "eval_steps_per_second": 41.175,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 4.038356781005859,
+      "step": 1750
+    },
+    {
+      "epoch": 7.5,
+      "learning_rate": 5.008000000000001e-06,
+      "loss": 0.6438,
+      "step": 1875
+    },
+    {
+      "epoch": 7.5,
+      "eval_accuracy": 0.6925,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 26.203964233398438,
+      "eval_f1": 0.6886960392924729,
+      "eval_gpu_ram_allocated": 0.3995976448059082,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 28,
+      "eval_loss": 1.0473765134811401,
+      "eval_precision": 0.6906747949914751,
+      "eval_recall": 0.6925,
+      "eval_runtime": 1.5569,
+      "eval_samples_per_second": 1284.611,
+      "eval_steps_per_second": 40.465,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 3.827362060546875,
+      "step": 1875
+    },
+    {
+      "epoch": 8.0,
+      "learning_rate": 4.008e-06,
+      "loss": 0.6326,
+      "step": 2000
+    },
+    {
+      "epoch": 8.0,
+      "eval_accuracy": 0.698,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 26.204063415527344,
+      "eval_f1": 0.6972467602684949,
+      "eval_gpu_ram_allocated": 0.39958906173706055,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 34,
+      "eval_loss": 1.03837251663208,
+      "eval_precision": 0.6982790583069545,
+      "eval_recall": 0.698,
+      "eval_runtime": 1.5106,
+      "eval_samples_per_second": 1323.952,
+      "eval_steps_per_second": 41.704,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 3.8401947021484375,
+      "step": 2000
+    },
+    {
+      "epoch": 8.5,
+      "learning_rate": 3.0080000000000003e-06,
+      "loss": 0.6121,
+      "step": 2125
+    },
+    {
+      "epoch": 8.5,
+      "eval_accuracy": 0.698,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 26.20423126220703,
+      "eval_f1": 0.6962705560782918,
+      "eval_gpu_ram_allocated": 0.39959049224853516,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 29,
+      "eval_loss": 1.0439949035644531,
+      "eval_precision": 0.6975979381837488,
+      "eval_recall": 0.698,
+      "eval_runtime": 1.5616,
+      "eval_samples_per_second": 1280.706,
+      "eval_steps_per_second": 40.342,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 4.016208648681641,
+      "step": 2125
+    },
+    {
+      "epoch": 9.0,
+      "learning_rate": 2.008e-06,
+      "loss": 0.5911,
+      "step": 2250
+    },
+    {
+      "epoch": 9.0,
+      "eval_accuracy": 0.701,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 26.204296112060547,
+      "eval_f1": 0.6995247290600446,
+      "eval_gpu_ram_allocated": 0.3996105194091797,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 28,
+      "eval_loss": 1.0518174171447754,
+      "eval_precision": 0.7006323341620143,
+      "eval_recall": 0.701,
+      "eval_runtime": 1.5659,
+      "eval_samples_per_second": 1277.26,
+      "eval_steps_per_second": 40.234,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 4.033794403076172,
+      "step": 2250
+    },
+    {
+      "epoch": 9.5,
+      "learning_rate": 1.0080000000000001e-06,
+      "loss": 0.592,
+      "step": 2375
+    },
+    {
+      "epoch": 9.5,
+      "eval_accuracy": 0.7035,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 26.20429229736328,
+      "eval_f1": 0.7022917649865421,
+      "eval_gpu_ram_allocated": 0.3996419906616211,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 27,
+      "eval_loss": 1.0490039587020874,
+      "eval_precision": 0.702476293906477,
+      "eval_recall": 0.7035,
+      "eval_runtime": 1.5585,
+      "eval_samples_per_second": 1283.281,
+      "eval_steps_per_second": 40.423,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 3.8126220703125,
+      "step": 2375
+    },
+    {
+      "epoch": 10.0,
+      "learning_rate": 8e-09,
+      "loss": 0.5586,
+      "step": 2500
+    },
+    {
+      "epoch": 10.0,
+      "eval_accuracy": 0.701,
+      "eval_disk_space_total": 78.1898422241211,
+      "eval_disk_space_used": 26.204303741455078,
+      "eval_f1": 0.6984193396838297,
+      "eval_gpu_ram_allocated": 0.3996291160583496,
+      "eval_gpu_ram_cached": 12.9296875,
+      "eval_gpu_ram_total": 39.56402587890625,
+      "eval_gpu_utilization": 27,
+      "eval_loss": 1.0510661602020264,
+      "eval_precision": 0.700028711222529,
+      "eval_recall": 0.701,
+      "eval_runtime": 1.5162,
+      "eval_samples_per_second": 1319.056,
+      "eval_steps_per_second": 41.55,
+      "eval_system_ram_total": 83.48074722290039,
+      "eval_system_ram_used": 3.844818115234375,
+      "step": 2500
     }
   ],
   "max_steps": 2500,
   "num_train_epochs": 10,
+  "total_flos": 1262611619041920.0,
   "trial_name": null,
   "trial_params": null
 }

{checkpoint-1500 → checkpoint-2500}/training_args.bin RENAMED Viewed

File without changes

{checkpoint-1500 → checkpoint-2500}/vocab.txt RENAMED Viewed

File without changes

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:294d34cfcdd9a17427a0a09cdf19e071c82e8ce59c34f4fe159d3c5118d1082d
 size 133523761

 version https://git-lfs.github.com/spec/v1
+oid sha256:a16a1346b21837ee13d52ba582c706fb96643d039a8ec745ade06a4e78deb60b
 size 133523761

runs/Jul23_00-54-01_c587bebf8fcc/events.out.tfevents.1690073651.c587bebf8fcc.2239.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0a87e472813cf54d514cc70f3dcc6d715385ff7ad568595a73f287577b33a094
-size 22489

 version https://git-lfs.github.com/spec/v1
+oid sha256:bbecb5c809c6be6c8afb303e013916d04358d96b487dee4dec559b0dcf5d3a75
+size 26897