AmberYifan commited on
Commit
2bb2f92
·
verified ·
1 Parent(s): 2da7d03

Training in progress, step 558, checkpoint

Browse files
last-checkpoint/global_step558/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a37984e3d0f9c1c5d696acc21cba3906de55edccf77e3023ecc511ee5e37b569
3
+ size 13476835648
last-checkpoint/global_step558/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f547832a81f42aeeafd49a1cc65d41d2df32e051e40157947704b9a1155238f
3
+ size 13476835648
last-checkpoint/global_step558/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95afb97a925bacac29c72a9d24ffb4d62ae6240a14503ab843da0140a5798bda
3
+ size 13476835648
last-checkpoint/global_step558/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1bbd294af0ad163e1633b47ceee6c37e2fa96c18f062607b44ebcfea885331c
3
+ size 13476835648
last-checkpoint/global_step558/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4197fab2e1b6c27eb80b4a12b9a89a88edef0d3b3bc4098bec66af56ce12175
3
+ size 150693
last-checkpoint/global_step558/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78b498011d22d6099b99f0e237cd72ed3cc9140d37841de3cb31cf16841ffd25
3
+ size 150693
last-checkpoint/global_step558/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f4e0cdbc12c565dcf5572f41f7bcd3101a01a4f373e5c67c204ba7126453f93
3
+ size 150693
last-checkpoint/global_step558/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:305d0a1a20b6d3b7dde4970a8b61cc22630f0e88cc5cba0ed422e6061840955a
3
+ size 150693
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step434
 
1
+ global_step558
last-checkpoint/model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2fef6470f7acc874fee3a68835c1e53f9e438740a72cbb8ea86cf21bc36d77b1
3
  size 4938985352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2eccfa1140badd2ba7d268833cb25515f4786a3a376ec7a70189454ca431a110
3
  size 4938985352
last-checkpoint/model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7cc1149db49c837b4f2389db2c37feaa906d3adb3e8662e04df81300f5949c6
3
  size 4947390880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afe95f19ba0b1d4f787647f396ad33e86582154ac38970507e3c4115ffd80235
3
  size 4947390880
last-checkpoint/model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b1ff4b2e559cf432ff17d10304f27ce70f3abfb9363d7c2dbc92b8260e596045
3
  size 3590488816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df33b2ae5733ef2380bc3366fb815ee4c3945810dd8a329f5963184b58b41341
3
  size 3590488816
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe3f96a2fff0ebd8dbcc2b4789c9dd47a218358381d8dc0c22453d73cc18c13a
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb3d4793d6c7fda650513b6f3d24fe7afd643475a576b0104a85cb659ed441d3
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:03c2e37b3b994a43a2c3a96dca7647061b052e8930abe99d16ea118bb9a4e2bc
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e44567105884943a8351ea71e9a71011cceee34a8f2a067be69948ea21390f49
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd2fb470636af306fe33bfa071a70c5e89bbc147a17ff3351e6d952861610b64
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c3a6f11c1c82a313f717b58d29d20267d0bfc621c79116ac6f752e0c1ba1f50
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:42f403a555728d319355f2901e7ccab38b27c2ffdef1825aa77e363c48d96a77
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaa97839e10563397740560600a86ccaf5a6fe1e5f41084453cab0f732a05570
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:765f176539e61f4c6bc8f2ad5d717ae2c3e0b0b105343abdeb194f4ded8a8b9b
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:177a5448d699047d35d72636914adc373df5f511600959de3a1ed1ce15a52556
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.3888,
5
  "eval_steps": 62,
6
- "global_step": 434,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -779,6 +779,218 @@
779
  "eval_samples_per_second": 7.939,
780
  "eval_steps_per_second": 0.516,
781
  "step": 434
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
782
  }
783
  ],
784
  "logging_steps": 10,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.7856,
5
  "eval_steps": 62,
6
+ "global_step": 558,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
779
  "eval_samples_per_second": 7.939,
780
  "eval_steps_per_second": 0.516,
781
  "step": 434
782
+ },
783
+ {
784
+ "epoch": 1.408,
785
+ "grad_norm": 16.14545407384991,
786
+ "learning_rate": 2.9453681710213776e-07,
787
+ "logits/generated": -0.9800319671630859,
788
+ "logits/real": -0.9277538061141968,
789
+ "logps/generated": -141.30862426757812,
790
+ "logps/real": -147.81869506835938,
791
+ "loss": 0.6465,
792
+ "rewards/accuracies": 0.762499988079071,
793
+ "rewards/generated": 3.95501971244812,
794
+ "rewards/margins": 0.6686196327209473,
795
+ "rewards/real": 4.6236395835876465,
796
+ "step": 440
797
+ },
798
+ {
799
+ "epoch": 1.44,
800
+ "grad_norm": 15.77508759846596,
801
+ "learning_rate": 2.885985748218527e-07,
802
+ "logits/generated": -1.066090703010559,
803
+ "logits/real": -0.9800545573234558,
804
+ "logps/generated": -118.1541748046875,
805
+ "logps/real": -114.2128677368164,
806
+ "loss": 0.6559,
807
+ "rewards/accuracies": 0.762499988079071,
808
+ "rewards/generated": 3.9932830333709717,
809
+ "rewards/margins": 0.5581256151199341,
810
+ "rewards/real": 4.5514092445373535,
811
+ "step": 450
812
+ },
813
+ {
814
+ "epoch": 1.472,
815
+ "grad_norm": 13.373472109654648,
816
+ "learning_rate": 2.8266033254156767e-07,
817
+ "logits/generated": -1.1050423383712769,
818
+ "logits/real": -1.059169888496399,
819
+ "logps/generated": -126.13043212890625,
820
+ "logps/real": -127.02229309082031,
821
+ "loss": 0.6429,
822
+ "rewards/accuracies": 0.7124999761581421,
823
+ "rewards/generated": 3.960355281829834,
824
+ "rewards/margins": 0.5283070206642151,
825
+ "rewards/real": 4.488662242889404,
826
+ "step": 460
827
+ },
828
+ {
829
+ "epoch": 1.504,
830
+ "grad_norm": 18.748026049573703,
831
+ "learning_rate": 2.7672209026128263e-07,
832
+ "logits/generated": -1.0380802154541016,
833
+ "logits/real": -1.0288408994674683,
834
+ "logps/generated": -124.66336822509766,
835
+ "logps/real": -129.6002197265625,
836
+ "loss": 0.631,
837
+ "rewards/accuracies": 0.762499988079071,
838
+ "rewards/generated": 4.066103458404541,
839
+ "rewards/margins": 0.5287829637527466,
840
+ "rewards/real": 4.59488582611084,
841
+ "step": 470
842
+ },
843
+ {
844
+ "epoch": 1.536,
845
+ "grad_norm": 18.771817584136546,
846
+ "learning_rate": 2.7078384798099764e-07,
847
+ "logits/generated": -1.030465841293335,
848
+ "logits/real": -1.0079973936080933,
849
+ "logps/generated": -110.46805572509766,
850
+ "logps/real": -130.38272094726562,
851
+ "loss": 0.6314,
852
+ "rewards/accuracies": 0.800000011920929,
853
+ "rewards/generated": 4.3078484535217285,
854
+ "rewards/margins": 0.575871467590332,
855
+ "rewards/real": 4.883719444274902,
856
+ "step": 480
857
+ },
858
+ {
859
+ "epoch": 1.568,
860
+ "grad_norm": 18.77488834205678,
861
+ "learning_rate": 2.648456057007126e-07,
862
+ "logits/generated": -1.0200045108795166,
863
+ "logits/real": -0.9613162875175476,
864
+ "logps/generated": -121.91667175292969,
865
+ "logps/real": -125.25045013427734,
866
+ "loss": 0.6575,
867
+ "rewards/accuracies": 0.800000011920929,
868
+ "rewards/generated": 4.19071626663208,
869
+ "rewards/margins": 0.5527010560035706,
870
+ "rewards/real": 4.743417263031006,
871
+ "step": 490
872
+ },
873
+ {
874
+ "epoch": 1.5872000000000002,
875
+ "eval_logits/generated": -1.0562151670455933,
876
+ "eval_logits/real": -0.9284681081771851,
877
+ "eval_logps/generated": -117.39347839355469,
878
+ "eval_logps/real": -131.05850219726562,
879
+ "eval_loss": 0.7352110147476196,
880
+ "eval_rewards/accuracies": 0.6538461446762085,
881
+ "eval_rewards/generated": 4.491795063018799,
882
+ "eval_rewards/margins": 0.3582780063152313,
883
+ "eval_rewards/real": 4.850072860717773,
884
+ "eval_runtime": 33.2476,
885
+ "eval_samples_per_second": 6.015,
886
+ "eval_steps_per_second": 0.391,
887
+ "step": 496
888
+ },
889
+ {
890
+ "epoch": 1.6,
891
+ "grad_norm": 16.35108797368165,
892
+ "learning_rate": 2.589073634204275e-07,
893
+ "logits/generated": -1.1007959842681885,
894
+ "logits/real": -1.0145621299743652,
895
+ "logps/generated": -118.1299057006836,
896
+ "logps/real": -132.48341369628906,
897
+ "loss": 0.6584,
898
+ "rewards/accuracies": 0.824999988079071,
899
+ "rewards/generated": 4.270500659942627,
900
+ "rewards/margins": 0.6508221626281738,
901
+ "rewards/real": 4.921322822570801,
902
+ "step": 500
903
+ },
904
+ {
905
+ "epoch": 1.6320000000000001,
906
+ "grad_norm": 18.24668534196415,
907
+ "learning_rate": 2.529691211401425e-07,
908
+ "logits/generated": -1.0347979068756104,
909
+ "logits/real": -1.0171585083007812,
910
+ "logps/generated": -134.5014190673828,
911
+ "logps/real": -128.9965362548828,
912
+ "loss": 0.6401,
913
+ "rewards/accuracies": 0.7749999761581421,
914
+ "rewards/generated": 4.300790309906006,
915
+ "rewards/margins": 0.6908756494522095,
916
+ "rewards/real": 4.991666316986084,
917
+ "step": 510
918
+ },
919
+ {
920
+ "epoch": 1.6640000000000001,
921
+ "grad_norm": 26.651414563625863,
922
+ "learning_rate": 2.4703087885985747e-07,
923
+ "logits/generated": -1.0487991571426392,
924
+ "logits/real": -0.9584493637084961,
925
+ "logps/generated": -112.0241928100586,
926
+ "logps/real": -135.36444091796875,
927
+ "loss": 0.6194,
928
+ "rewards/accuracies": 0.7749999761581421,
929
+ "rewards/generated": 4.406290531158447,
930
+ "rewards/margins": 0.6576591730117798,
931
+ "rewards/real": 5.0639495849609375,
932
+ "step": 520
933
+ },
934
+ {
935
+ "epoch": 1.696,
936
+ "grad_norm": 15.873503010462953,
937
+ "learning_rate": 2.410926365795724e-07,
938
+ "logits/generated": -1.0919219255447388,
939
+ "logits/real": -0.9894660115242004,
940
+ "logps/generated": -116.85237121582031,
941
+ "logps/real": -134.66482543945312,
942
+ "loss": 0.6307,
943
+ "rewards/accuracies": 0.7749999761581421,
944
+ "rewards/generated": 4.291749477386475,
945
+ "rewards/margins": 0.566550612449646,
946
+ "rewards/real": 4.85830020904541,
947
+ "step": 530
948
+ },
949
+ {
950
+ "epoch": 1.728,
951
+ "grad_norm": 18.65864238709199,
952
+ "learning_rate": 2.351543942992874e-07,
953
+ "logits/generated": -1.0818088054656982,
954
+ "logits/real": -1.0851285457611084,
955
+ "logps/generated": -121.41314697265625,
956
+ "logps/real": -126.65281677246094,
957
+ "loss": 0.6306,
958
+ "rewards/accuracies": 0.7749999761581421,
959
+ "rewards/generated": 4.241837978363037,
960
+ "rewards/margins": 0.7786606550216675,
961
+ "rewards/real": 5.020498752593994,
962
+ "step": 540
963
+ },
964
+ {
965
+ "epoch": 1.76,
966
+ "grad_norm": 16.985163916244147,
967
+ "learning_rate": 2.2921615201900234e-07,
968
+ "logits/generated": -1.0255613327026367,
969
+ "logits/real": -1.0782816410064697,
970
+ "logps/generated": -121.6998519897461,
971
+ "logps/real": -118.9133529663086,
972
+ "loss": 0.6606,
973
+ "rewards/accuracies": 0.6000000238418579,
974
+ "rewards/generated": 4.7306671142578125,
975
+ "rewards/margins": 0.3756607174873352,
976
+ "rewards/real": 5.106327533721924,
977
+ "step": 550
978
+ },
979
+ {
980
+ "epoch": 1.7856,
981
+ "eval_logits/generated": -1.0969022512435913,
982
+ "eval_logits/real": -0.9780063629150391,
983
+ "eval_logps/generated": -114.82669830322266,
984
+ "eval_logps/real": -128.44029235839844,
985
+ "eval_loss": 0.7269737720489502,
986
+ "eval_rewards/accuracies": 0.6538461446762085,
987
+ "eval_rewards/generated": 4.748473167419434,
988
+ "eval_rewards/margins": 0.36342188715934753,
989
+ "eval_rewards/real": 5.1118950843811035,
990
+ "eval_runtime": 25.1083,
991
+ "eval_samples_per_second": 7.965,
992
+ "eval_steps_per_second": 0.518,
993
+ "step": 558
994
  }
995
  ],
996
  "logging_steps": 10,