diogopaes10 committed on
Commit
ee46bfd
•
1 Parent(s): 0068b57

Training in progress, step 9000

Browse files
{checkpoint-8000 → checkpoint-9000}/config.json RENAMED
File without changes
{checkpoint-8000 → checkpoint-9000}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9abe0e8f69303d52151b969a2c04c7af80d0cf5c07bb60230685b54fb6a90681
3
  size 267028677
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2aaa514a645b3543ce5eed9aa79ddf13738a23c43efec01f7783f6f91edc976
3
  size 267028677
{checkpoint-8000 → checkpoint-9000}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b50c95651d8742468f5f1edbb4c2a14528dd86e25791b998adf152efec55c433
3
  size 133523761
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79f5061e5a30af545971dc68a923c602fdcaefe82abfb235cb7eb3cfc6f0461e
3
  size 133523761
{checkpoint-8000 → checkpoint-9000}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0dc55218bdc42ff7df739a80eaf2657105d315fc0b250d25ef07f483b21f49a9
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8905509a997e07d858d9bf12354f357592c998338dceb452007c9f660165126
3
  size 14575
{checkpoint-8000 → checkpoint-9000}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:671cc681d0ecb84643611d2563b43c627f5dae632f0d2170fd28d187ec353ec1
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:119e088f3274dbc64560596e1bafffa29de6f0e97bfe9f98610ffd8b8271fda9
3
  size 627
{checkpoint-8000 → checkpoint-9000}/special_tokens_map.json RENAMED
File without changes
{checkpoint-8000 → checkpoint-9000}/tokenizer.json RENAMED
File without changes
{checkpoint-8000 → checkpoint-9000}/tokenizer_config.json RENAMED
File without changes
{checkpoint-8000 → checkpoint-9000}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 3.2,
5
- "global_step": 8000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -324,11 +324,63 @@
324
  "eval_system_ram_total": 83.48074722290039,
325
  "eval_system_ram_used": 3.8610610961914062,
326
  "step": 7500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
327
  }
328
  ],
329
  "max_steps": 12500,
330
  "num_train_epochs": 5,
331
- "total_flos": 4064276534220672.0,
332
  "trial_name": null,
333
  "trial_params": null
334
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.6,
5
+ "global_step": 9000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
324
  "eval_system_ram_total": 83.48074722290039,
325
  "eval_system_ram_used": 3.8610610961914062,
326
  "step": 7500
327
+ },
328
+ {
329
+ "epoch": 3.25,
330
+ "learning_rate": 7.0048e-06,
331
+ "loss": 0.6929,
332
+ "step": 8125
333
+ },
334
+ {
335
+ "epoch": 3.25,
336
+ "eval_accuracy": 0.73505,
337
+ "eval_disk_space_total": 78.1898422241211,
338
+ "eval_disk_space_used": 26.468040466308594,
339
+ "eval_f1": 0.7321519443896675,
340
+ "eval_gpu_ram_allocated": 0.39360761642456055,
341
+ "eval_gpu_ram_cached": 16.05078125,
342
+ "eval_gpu_ram_total": 39.56402587890625,
343
+ "eval_gpu_utilization": 29,
344
+ "eval_loss": 0.855096697807312,
345
+ "eval_precision": 0.7376195934146232,
346
+ "eval_recall": 0.73505,
347
+ "eval_runtime": 15.2462,
348
+ "eval_samples_per_second": 1311.799,
349
+ "eval_steps_per_second": 40.994,
350
+ "eval_system_ram_total": 83.48074722290039,
351
+ "eval_system_ram_used": 4.056495666503906,
352
+ "step": 8125
353
+ },
354
+ {
355
+ "epoch": 3.5,
356
+ "learning_rate": 6.0048000000000005e-06,
357
+ "loss": 0.6772,
358
+ "step": 8750
359
+ },
360
+ {
361
+ "epoch": 3.5,
362
+ "eval_accuracy": 0.738,
363
+ "eval_disk_space_total": 78.1898422241211,
364
+ "eval_disk_space_used": 26.468387603759766,
365
+ "eval_f1": 0.7334835535994888,
366
+ "eval_gpu_ram_allocated": 0.3935232162475586,
367
+ "eval_gpu_ram_cached": 16.05078125,
368
+ "eval_gpu_ram_total": 39.56402587890625,
369
+ "eval_gpu_utilization": 31,
370
+ "eval_loss": 0.84714674949646,
371
+ "eval_precision": 0.7326757628965238,
372
+ "eval_recall": 0.738,
373
+ "eval_runtime": 15.3571,
374
+ "eval_samples_per_second": 1302.33,
375
+ "eval_steps_per_second": 40.698,
376
+ "eval_system_ram_total": 83.48074722290039,
377
+ "eval_system_ram_used": 3.835094451904297,
378
+ "step": 8750
379
  }
380
  ],
381
  "max_steps": 12500,
382
  "num_train_epochs": 5,
383
+ "total_flos": 4574352934241664.0,
384
  "trial_name": null,
385
  "trial_params": null
386
  }
{checkpoint-8000 → checkpoint-9000}/training_args.bin RENAMED
File without changes
{checkpoint-8000 → checkpoint-9000}/vocab.txt RENAMED
File without changes
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d19e08ba096c383cb407dec2f4cecd928204b303f09a66a53ca72692cc9ce44
3
  size 133523761
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79f5061e5a30af545971dc68a923c602fdcaefe82abfb235cb7eb3cfc6f0461e
3
  size 133523761
runs/Jul23_01-08-06_df8adf32a670/events.out.tfevents.1690074496.df8adf32a670.1420.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04c5b433cdb9e1eccd5068c69d47c3726823edfdd4d7bc5d52c436d1954f52bb
3
- size 19208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:391f5f9f0ccddb11061193f1ce4a643a7a8ea6d38d9ce3a93250aa260c6e5b18
3
+ size 20310