Femboyuwu2000 committed on
Commit
3fefd82
1 Parent(s): 1205456

Training in progress, step 980, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd6935101c95c7a3fcf35393fcef907ca744d140d002e80f3e1ab8bc68740781
3
  size 13982248
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a38c93e994650fe4c83da9cfce04fe1541ec31a2ec6907ff09b91f14be34ad4d
3
  size 13982248
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:efbc01513003cd4778a5d7c40f35733a97acc954ec9ed9a205fe5bb1048cad2d
3
  size 7062522
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46cbd28b8ea82d833a6eeaf797d7e79113fcfd64f188a19553eb3bcd4a1e3573
3
  size 7062522
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a60dce02b424b527030edce82260ee74eebf81dd57466a5e2b83b22d49a22b4a
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c5410d295859629eb5c5221ec007a76d5ecce5c325cbaeb984aecc19e1cfef7
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b961e5bd3f5ce2b76de5850c52ad545f91b84e33c7fc906eadd1fa38681efcd4
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1deaeac856492d3d5086d74c9dfcab210016322b2b2c1701903eaa6e0b81545c
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.0768,
5
  "eval_steps": 500,
6
- "global_step": 960,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -343,6 +343,13 @@
343
  "learning_rate": 2.997451764584951e-05,
344
  "loss": 3.7494,
345
  "step": 960
 
 
 
 
 
 
 
346
  }
347
  ],
348
  "logging_steps": 20,
@@ -350,7 +357,7 @@
350
  "num_input_tokens_seen": 0,
351
  "num_train_epochs": 2,
352
  "save_steps": 20,
353
- "total_flos": 2278337822490624.0,
354
  "train_batch_size": 8,
355
  "trial_name": null,
356
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.0784,
5
  "eval_steps": 500,
6
+ "global_step": 980,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
343
  "learning_rate": 2.997451764584951e-05,
344
  "loss": 3.7494,
345
  "step": 960
346
+ },
347
+ {
348
+ "epoch": 0.08,
349
+ "grad_norm": 33.610286712646484,
350
+ "learning_rate": 2.9971608542252175e-05,
351
+ "loss": 3.7077,
352
+ "step": 980
353
  }
354
  ],
355
  "logging_steps": 20,
 
357
  "num_input_tokens_seen": 0,
358
  "num_train_epochs": 2,
359
  "save_steps": 20,
360
+ "total_flos": 2331220953563136.0,
361
  "train_batch_size": 8,
362
  "trial_name": null,
363
  "trial_params": null