hofarah commited on
Commit
f73ba9d
1 Parent(s): dc83601

Training in progress, step 360

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:717aeabd41162df58c589016e262864ca577bac403e982cd24e9397df8d808b9
3
  size 3545432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3786ba93365a1ee7b1ae5886a0f9a4c711aab7ed233d909a2f3d469512b6005f
3
  size 3545432
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af7dc2e0c6eac7de952444cda2f8a83b2d8ea1e3e332c7b71d88efa3373715d8
3
  size 1140034381
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9373701b4d3cd12bb97d502c54292e9ac07566346dda7a7d5485ed8c5163afc4
3
  size 1140034381
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b2ebb2a66011e7d1a3811ef684f1282f4aaec21ae4f3b25e3ee99eaee99d42d
3
  size 14511
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6203e50d371e7fa8a5f28de7e01da29302f09791f7fb1158a31d3b5b121115d0
3
  size 14511
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:964c2be91d4357cef5d0efd7d9436b648b6eb7a171890a57465951684d53da2f
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:083f1a4a1187ab20495ecc4456f9059e4e2102fc6106c30448967df2a7b52303
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.591919191919192,
5
- "global_step": 320,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -478,11 +478,70 @@
478
  "eval_samples_per_second": 0.054,
479
  "eval_steps_per_second": 0.028,
480
  "step": 320
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
481
  }
482
  ],
483
  "max_steps": 369,
484
  "num_train_epochs": 3,
485
- "total_flos": 1.248720939122688e+16,
486
  "trial_name": null,
487
  "trial_params": null
488
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.915151515151515,
5
+ "global_step": 360,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
478
  "eval_samples_per_second": 0.054,
479
  "eval_steps_per_second": 0.028,
480
  "step": 320
481
+ },
482
+ {
483
+ "epoch": 2.63,
484
+ "learning_rate": 6.368563685636857e-06,
485
+ "loss": 3.5124,
486
+ "step": 325
487
+ },
488
+ {
489
+ "epoch": 2.67,
490
+ "learning_rate": 5.6910569105691056e-06,
491
+ "loss": 3.128,
492
+ "step": 330
493
+ },
494
+ {
495
+ "epoch": 2.71,
496
+ "learning_rate": 5.013550135501355e-06,
497
+ "loss": 3.6112,
498
+ "step": 335
499
+ },
500
+ {
501
+ "epoch": 2.75,
502
+ "learning_rate": 4.336043360433605e-06,
503
+ "loss": 3.0695,
504
+ "step": 340
505
+ },
506
+ {
507
+ "epoch": 2.79,
508
+ "learning_rate": 3.6585365853658537e-06,
509
+ "loss": 3.4197,
510
+ "step": 345
511
+ },
512
+ {
513
+ "epoch": 2.83,
514
+ "learning_rate": 3.116531165311653e-06,
515
+ "loss": 3.2216,
516
+ "step": 350
517
+ },
518
+ {
519
+ "epoch": 2.87,
520
+ "learning_rate": 2.4390243902439027e-06,
521
+ "loss": 3.1863,
522
+ "step": 355
523
+ },
524
+ {
525
+ "epoch": 2.92,
526
+ "learning_rate": 1.7615176151761518e-06,
527
+ "loss": 3.3628,
528
+ "step": 360
529
+ },
530
+ {
531
+ "epoch": 2.92,
532
+ "eval_loss": 3.125962972640991,
533
+ "eval_rouge2_fmeasure": 0.0,
534
+ "eval_rouge2_precision": 0.0,
535
+ "eval_rouge2_recall": 0.0,
536
+ "eval_runtime": 439.7386,
537
+ "eval_samples_per_second": 0.061,
538
+ "eval_steps_per_second": 0.032,
539
+ "step": 360
540
  }
541
  ],
542
  "max_steps": 369,
543
  "num_train_epochs": 3,
544
+ "total_flos": 1.404811056513024e+16,
545
  "trial_name": null,
546
  "trial_params": null
547
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af7dc2e0c6eac7de952444cda2f8a83b2d8ea1e3e332c7b71d88efa3373715d8
3
  size 1140034381
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9373701b4d3cd12bb97d502c54292e9ac07566346dda7a7d5485ed8c5163afc4
3
  size 1140034381