diogopaes10 committed on
Commit
8ba813b
•
1 Parent(s): 7716bc6

Training in progress, step 7000

Browse files
{checkpoint-6000 → checkpoint-7000}/config.json RENAMED
File without changes
{checkpoint-6000 → checkpoint-7000}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cbbd04456094b8f62f81be236b8f37719fbf607db2f5317a245e9f96531d3614
3
  size 267028677
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5ce3f709d5bf2ef52f9be3ee11720c11875cd7c7cbc5b113ff2ec13fbdcfad0
3
  size 267028677
{checkpoint-6000 → checkpoint-7000}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4a5fe9ab1af707e6e666bf9069b7b56e145d52944efdb70375f4c403eaca7195
3
  size 133523761
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fdd9c25a3b2561db68e4954c56b65812fa0e930619abfda842bc9c9be92f795
3
  size 133523761
{checkpoint-6000 → checkpoint-7000}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b084a0eea70333dcd8dbab59962a7694134fa08b5d76a92944b1542c36edaf1
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29da9df454e7746cda5ce0c1f5109f66bd169affee62d8d85c9b49f078e94f24
3
  size 14575
{checkpoint-6000 → checkpoint-7000}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bbd027476f4332bd868b6e552f26649d456aa519924fdc5327d6864bb44c7b9e
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:faac9c70fa11627d95e4ba1e0d56c13061abc404909001c070224e133cd0adf8
3
  size 627
{checkpoint-6000 → checkpoint-7000}/special_tokens_map.json RENAMED
File without changes
{checkpoint-6000 → checkpoint-7000}/tokenizer.json RENAMED
File without changes
{checkpoint-6000 → checkpoint-7000}/tokenizer_config.json RENAMED
File without changes
{checkpoint-6000 → checkpoint-7000}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.4,
5
- "global_step": 6000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -246,11 +246,63 @@
246
  "eval_system_ram_total": 83.48074722290039,
247
  "eval_system_ram_used": 4.057643890380859,
248
  "step": 5625
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
249
  }
250
  ],
251
  "max_steps": 12500,
252
  "num_train_epochs": 5,
253
- "total_flos": 3048208430074752.0,
254
  "trial_name": null,
255
  "trial_params": null
256
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.8,
5
+ "global_step": 7000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
246
  "eval_system_ram_total": 83.48074722290039,
247
  "eval_system_ram_used": 4.057643890380859,
248
  "step": 5625
249
+ },
250
+ {
251
+ "epoch": 2.5,
252
+ "learning_rate": 1.0004800000000001e-05,
253
+ "loss": 0.7523,
254
+ "step": 6250
255
+ },
256
+ {
257
+ "epoch": 2.5,
258
+ "eval_accuracy": 0.734,
259
+ "eval_disk_space_total": 78.1898422241211,
260
+ "eval_disk_space_used": 26.46658706665039,
261
+ "eval_f1": 0.7295923418650617,
262
+ "eval_gpu_ram_allocated": 0.39351463317871094,
263
+ "eval_gpu_ram_cached": 16.05078125,
264
+ "eval_gpu_ram_total": 39.56402587890625,
265
+ "eval_gpu_utilization": 32,
266
+ "eval_loss": 0.8498074412345886,
267
+ "eval_precision": 0.7313935171526833,
268
+ "eval_recall": 0.734,
269
+ "eval_runtime": 15.7189,
270
+ "eval_samples_per_second": 1272.356,
271
+ "eval_steps_per_second": 39.761,
272
+ "eval_system_ram_total": 83.48074722290039,
273
+ "eval_system_ram_used": 3.8655662536621094,
274
+ "step": 6250
275
+ },
276
+ {
277
+ "epoch": 2.75,
278
+ "learning_rate": 9.0048e-06,
279
+ "loss": 0.7396,
280
+ "step": 6875
281
+ },
282
+ {
283
+ "epoch": 2.75,
284
+ "eval_accuracy": 0.73645,
285
+ "eval_disk_space_total": 78.1898422241211,
286
+ "eval_disk_space_used": 26.466869354248047,
287
+ "eval_f1": 0.7326318327243708,
288
+ "eval_gpu_ram_allocated": 0.3934817314147949,
289
+ "eval_gpu_ram_cached": 16.05078125,
290
+ "eval_gpu_ram_total": 39.56402587890625,
291
+ "eval_gpu_utilization": 33,
292
+ "eval_loss": 0.8402908444404602,
293
+ "eval_precision": 0.7323211491997443,
294
+ "eval_recall": 0.73645,
295
+ "eval_runtime": 15.1367,
296
+ "eval_samples_per_second": 1321.295,
297
+ "eval_steps_per_second": 41.29,
298
+ "eval_system_ram_total": 83.48074722290039,
299
+ "eval_system_ram_used": 3.8685684204101562,
300
+ "step": 6875
301
  }
302
  ],
303
  "max_steps": 12500,
304
  "num_train_epochs": 5,
305
+ "total_flos": 3558041889513216.0,
306
  "trial_name": null,
307
  "trial_params": null
308
  }
{checkpoint-6000 → checkpoint-7000}/training_args.bin RENAMED
File without changes
{checkpoint-6000 → checkpoint-7000}/vocab.txt RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54529faf9f7f062e28808f303e29fbb6fd53466445f34fc24c3b8832206ef78e
3
  size 133523761
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fdd9c25a3b2561db68e4954c56b65812fa0e930619abfda842bc9c9be92f795
3
  size 133523761
runs/Jul23_01-08-06_df8adf32a670/events.out.tfevents.1690074496.df8adf32a670.1420.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35db62b0f69c0659ee7f59a1fe2522d3881646109a0efa1ddab0e713d968a77c
3
- size 15902
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9ac7f792ea22fc235d1b87725973015b45c098e2f1fae9c2407a9a80a92549f
3
+ size 17004