YL95 committed on
Commit
846754d
1 Parent(s): 4d9e75b

training state at step 70

Browse files
Files changed (1) hide show
  1. trainer_state.json +78 -3
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.896551724137931,
5
  "eval_steps": 1,
6
- "global_step": 65,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -937,6 +937,81 @@
937
  "eval_samples_per_second": 1.097,
938
  "eval_steps_per_second": 0.549,
939
  "step": 64
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
940
  }
941
  ],
942
  "logging_steps": 1,
@@ -956,7 +1031,7 @@
956
  "attributes": {}
957
  }
958
  },
959
- "total_flos": 8.144087573982413e+16,
960
  "train_batch_size": 2,
961
  "trial_name": null,
962
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.9655172413793104,
5
  "eval_steps": 1,
6
+ "global_step": 70,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
937
  "eval_samples_per_second": 1.097,
938
  "eval_steps_per_second": 0.549,
939
  "step": 64
940
+ },
941
+ {
942
+ "epoch": 0.896551724137931,
943
+ "grad_norm": 1.9588886499404907,
944
+ "learning_rate": 2.272727272727273e-05,
945
+ "loss": 1.3699,
946
+ "step": 65
947
+ },
948
+ {
949
+ "epoch": 0.896551724137931,
950
+ "eval_loss": 0.8241379857063293,
951
+ "eval_runtime": 18.6162,
952
+ "eval_samples_per_second": 1.074,
953
+ "eval_steps_per_second": 0.537,
954
+ "step": 65
955
+ },
956
+ {
957
+ "epoch": 0.9103448275862069,
958
+ "grad_norm": 2.001984119415283,
959
+ "learning_rate": 2.5e-05,
960
+ "loss": 1.4399,
961
+ "step": 66
962
+ },
963
+ {
964
+ "epoch": 0.9103448275862069,
965
+ "eval_loss": 0.8220138549804688,
966
+ "eval_runtime": 18.4936,
967
+ "eval_samples_per_second": 1.081,
968
+ "eval_steps_per_second": 0.541,
969
+ "step": 66
970
+ },
971
+ {
972
+ "epoch": 0.9241379310344827,
973
+ "grad_norm": 1.9502840042114258,
974
+ "learning_rate": 2.7272727272727273e-05,
975
+ "loss": 1.1969,
976
+ "step": 67
977
+ },
978
+ {
979
+ "epoch": 0.9241379310344827,
980
+ "eval_loss": 0.8098680377006531,
981
+ "eval_runtime": 18.2406,
982
+ "eval_samples_per_second": 1.096,
983
+ "eval_steps_per_second": 0.548,
984
+ "step": 67
985
+ },
986
+ {
987
+ "epoch": 0.9379310344827586,
988
+ "grad_norm": 1.8572745323181152,
989
+ "learning_rate": 2.954545454545455e-05,
990
+ "loss": 1.1968,
991
+ "step": 68
992
+ },
993
+ {
994
+ "epoch": 0.9379310344827586,
995
+ "eval_loss": 0.7934565544128418,
996
+ "eval_runtime": 18.2457,
997
+ "eval_samples_per_second": 1.096,
998
+ "eval_steps_per_second": 0.548,
999
+ "step": 68
1000
+ },
1001
+ {
1002
+ "epoch": 0.9517241379310345,
1003
+ "grad_norm": 2.0354831218719482,
1004
+ "learning_rate": 3.181818181818182e-05,
1005
+ "loss": 1.2528,
1006
+ "step": 69
1007
+ },
1008
+ {
1009
+ "epoch": 0.9517241379310345,
1010
+ "eval_loss": 0.7829666137695312,
1011
+ "eval_runtime": 18.2217,
1012
+ "eval_samples_per_second": 1.098,
1013
+ "eval_steps_per_second": 0.549,
1014
+ "step": 69
1015
  }
1016
  ],
1017
  "logging_steps": 1,
 
1031
  "attributes": {}
1032
  }
1033
  },
1034
+ "total_flos": 8.799498944033587e+16,
1035
  "train_batch_size": 2,
1036
  "trial_name": null,
1037
  "trial_params": null