YL95 commited on
Commit
970ab5d
1 Parent(s): c030334

training state at step 45

Browse files
Files changed (1) hide show
  1. trainer_state.json +63 -3
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.5517241379310345,
5
  "eval_steps": 1,
6
- "global_step": 40,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -592,6 +592,66 @@
592
  "eval_samples_per_second": 1.137,
593
  "eval_steps_per_second": 0.569,
594
  "step": 39
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
595
  }
596
  ],
597
  "logging_steps": 1,
@@ -611,7 +671,7 @@
611
  "attributes": {}
612
  }
613
  },
614
- "total_flos": 5.112519916024627e+16,
615
  "train_batch_size": 2,
616
  "trial_name": null,
617
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.6206896551724138,
5
  "eval_steps": 1,
6
+ "global_step": 45,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
592
  "eval_samples_per_second": 1.137,
593
  "eval_steps_per_second": 0.569,
594
  "step": 39
595
+ },
596
+ {
597
+ "epoch": 0.5655172413793104,
598
+ "grad_norm": 2.2170450687408447,
599
+ "learning_rate": 2.2727272727272728e-06,
600
+ "loss": 1.316,
601
+ "step": 41
602
+ },
603
+ {
604
+ "epoch": 0.5655172413793104,
605
+ "eval_loss": 0.9163956642150879,
606
+ "eval_runtime": 15.7145,
607
+ "eval_samples_per_second": 1.273,
608
+ "eval_steps_per_second": 0.636,
609
+ "step": 41
610
+ },
611
+ {
612
+ "epoch": 0.5793103448275863,
613
+ "grad_norm": 2.2266974449157715,
614
+ "learning_rate": 4.5454545454545455e-06,
615
+ "loss": 1.3854,
616
+ "step": 42
617
+ },
618
+ {
619
+ "epoch": 0.5793103448275863,
620
+ "eval_loss": 0.9137259721755981,
621
+ "eval_runtime": 15.7133,
622
+ "eval_samples_per_second": 1.273,
623
+ "eval_steps_per_second": 0.636,
624
+ "step": 42
625
+ },
626
+ {
627
+ "epoch": 0.593103448275862,
628
+ "grad_norm": 2.3451268672943115,
629
+ "learning_rate": 6.818181818181818e-06,
630
+ "loss": 1.4208,
631
+ "step": 43
632
+ },
633
+ {
634
+ "epoch": 0.593103448275862,
635
+ "eval_loss": 0.9096618890762329,
636
+ "eval_runtime": 15.7895,
637
+ "eval_samples_per_second": 1.267,
638
+ "eval_steps_per_second": 0.633,
639
+ "step": 43
640
+ },
641
+ {
642
+ "epoch": 0.6068965517241379,
643
+ "grad_norm": 2.0125885009765625,
644
+ "learning_rate": 9.090909090909091e-06,
645
+ "loss": 1.4302,
646
+ "step": 44
647
+ },
648
+ {
649
+ "epoch": 0.6068965517241379,
650
+ "eval_loss": 0.9058458209037781,
651
+ "eval_runtime": 15.6899,
652
+ "eval_samples_per_second": 1.275,
653
+ "eval_steps_per_second": 0.637,
654
+ "step": 44
655
  }
656
  ],
657
  "logging_steps": 1,
 
671
  "attributes": {}
672
  }
673
  },
674
+ "total_flos": 5.643858048835584e+16,
675
  "train_batch_size": 2,
676
  "trial_name": null,
677
  "trial_params": null