diogopaes10 committed on
Commit
3cd1904
•
1 Parent(s): b3870a9

Training in progress, step 6000

Browse files
{checkpoint-5000 → checkpoint-6000}/config.json RENAMED
File without changes
{checkpoint-5000 → checkpoint-6000}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bee161d119a3ea04cbc152488336fe12942c45f8c6440c64d581a6ae7a63e196
3
  size 267028677
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbbd04456094b8f62f81be236b8f37719fbf607db2f5317a245e9f96531d3614
3
  size 267028677
{checkpoint-5000 → checkpoint-6000}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:352e9a72b0498ab48a08358e98d0673b58915c4301f40fcfe731efb083ca1d46
3
  size 133523761
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a5fe9ab1af707e6e666bf9069b7b56e145d52944efdb70375f4c403eaca7195
3
  size 133523761
{checkpoint-5000 → checkpoint-6000}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a0555291b2a6c57ddfbb94f07b1757a918e0eee55f74c1919774fc03e4c73ad3
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b084a0eea70333dcd8dbab59962a7694134fa08b5d76a92944b1542c36edaf1
3
  size 14575
{checkpoint-5000 → checkpoint-6000}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c13f5c121b0ca6f58116019336ba0d3c1b65f5195038f1617b67d9c0d670124f
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbd027476f4332bd868b6e552f26649d456aa519924fdc5327d6864bb44c7b9e
3
  size 627
{checkpoint-5000 → checkpoint-6000}/special_tokens_map.json RENAMED
File without changes
{checkpoint-5000 → checkpoint-6000}/tokenizer.json RENAMED
File without changes
{checkpoint-5000 → checkpoint-6000}/tokenizer_config.json RENAMED
File without changes
{checkpoint-5000 → checkpoint-6000}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.0,
5
- "global_step": 5000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -220,11 +220,37 @@
220
  "eval_system_ram_total": 83.48074722290039,
221
  "eval_system_ram_used": 3.8656463623046875,
222
  "step": 5000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
223
  }
224
  ],
225
  "max_steps": 12500,
226
  "num_train_epochs": 5,
227
- "total_flos": 2542920841875456.0,
228
  "trial_name": null,
229
  "trial_params": null
230
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.4,
5
+ "global_step": 6000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
220
  "eval_system_ram_total": 83.48074722290039,
221
  "eval_system_ram_used": 3.8656463623046875,
222
  "step": 5000
223
+ },
224
+ {
225
+ "epoch": 2.25,
226
+ "learning_rate": 1.10048e-05,
227
+ "loss": 0.7515,
228
+ "step": 5625
229
+ },
230
+ {
231
+ "epoch": 2.25,
232
+ "eval_accuracy": 0.73265,
233
+ "eval_disk_space_total": 78.1898422241211,
234
+ "eval_disk_space_used": 26.46636199951172,
235
+ "eval_f1": 0.7286075365290565,
236
+ "eval_gpu_ram_allocated": 0.3934974670410156,
237
+ "eval_gpu_ram_cached": 16.05078125,
238
+ "eval_gpu_ram_total": 39.56402587890625,
239
+ "eval_gpu_utilization": 32,
240
+ "eval_loss": 0.857990026473999,
241
+ "eval_precision": 0.7324340392002969,
242
+ "eval_recall": 0.73265,
243
+ "eval_runtime": 15.6042,
244
+ "eval_samples_per_second": 1281.705,
245
+ "eval_steps_per_second": 40.053,
246
+ "eval_system_ram_total": 83.48074722290039,
247
+ "eval_system_ram_used": 4.057643890380859,
248
+ "step": 5625
249
  }
250
  ],
251
  "max_steps": 12500,
252
  "num_train_epochs": 5,
253
+ "total_flos": 3048208430074752.0,
254
  "trial_name": null,
255
  "trial_params": null
256
  }
{checkpoint-5000 → checkpoint-6000}/training_args.bin RENAMED
File without changes
{checkpoint-5000 → checkpoint-6000}/vocab.txt RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a67afd612f4a76cdc4e92864450285f686180b7951cb56d2e649f5a12e7d6c33
3
  size 133523761
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a5fe9ab1af707e6e666bf9069b7b56e145d52944efdb70375f4c403eaca7195
3
  size 133523761
runs/Jul23_01-08-06_df8adf32a670/events.out.tfevents.1690074496.df8adf32a670.1420.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd2b39e54f4352ae95d2ac35fe20b48d1b9a815dd5b0a3cb67935a686b5bee85
3
- size 13698
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b66d6e8083d4fc61a1407154257c0dbf7b64fbec00463f89013e34bb889a0cd
3
+ size 14800