Training in progress, step 558, checkpoint
Browse files- last-checkpoint/global_step558/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step558/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step558/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step558/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step558/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step558/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step558/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step558/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/model-00001-of-00003.safetensors +1 -1
- last-checkpoint/model-00002-of-00003.safetensors +1 -1
- last-checkpoint/model-00003-of-00003.safetensors +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +214 -2
last-checkpoint/global_step558/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a37984e3d0f9c1c5d696acc21cba3906de55edccf77e3023ecc511ee5e37b569
|
3 |
+
size 13476835648
|
last-checkpoint/global_step558/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f547832a81f42aeeafd49a1cc65d41d2df32e051e40157947704b9a1155238f
|
3 |
+
size 13476835648
|
last-checkpoint/global_step558/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95afb97a925bacac29c72a9d24ffb4d62ae6240a14503ab843da0140a5798bda
|
3 |
+
size 13476835648
|
last-checkpoint/global_step558/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1bbd294af0ad163e1633b47ceee6c37e2fa96c18f062607b44ebcfea885331c
|
3 |
+
size 13476835648
|
last-checkpoint/global_step558/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4197fab2e1b6c27eb80b4a12b9a89a88edef0d3b3bc4098bec66af56ce12175
|
3 |
+
size 150693
|
last-checkpoint/global_step558/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78b498011d22d6099b99f0e237cd72ed3cc9140d37841de3cb31cf16841ffd25
|
3 |
+
size 150693
|
last-checkpoint/global_step558/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f4e0cdbc12c565dcf5572f41f7bcd3101a01a4f373e5c67c204ba7126453f93
|
3 |
+
size 150693
|
last-checkpoint/global_step558/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:305d0a1a20b6d3b7dde4970a8b61cc22630f0e88cc5cba0ed422e6061840955a
|
3 |
+
size 150693
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step558
|
last-checkpoint/model-00001-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4938985352
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2eccfa1140badd2ba7d268833cb25515f4786a3a376ec7a70189454ca431a110
|
3 |
size 4938985352
|
last-checkpoint/model-00002-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4947390880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afe95f19ba0b1d4f787647f396ad33e86582154ac38970507e3c4115ffd80235
|
3 |
size 4947390880
|
last-checkpoint/model-00003-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3590488816
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df33b2ae5733ef2380bc3366fb815ee4c3945810dd8a329f5963184b58b41341
|
3 |
size 3590488816
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb3d4793d6c7fda650513b6f3d24fe7afd643475a576b0104a85cb659ed441d3
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e44567105884943a8351ea71e9a71011cceee34a8f2a067be69948ea21390f49
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c3a6f11c1c82a313f717b58d29d20267d0bfc621c79116ac6f752e0c1ba1f50
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aaa97839e10563397740560600a86ccaf5a6fe1e5f41084453cab0f732a05570
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:177a5448d699047d35d72636914adc373df5f511600959de3a1ed1ce15a52556
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 1.
|
5 |
"eval_steps": 62,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -779,6 +779,218 @@
|
|
779 |
"eval_samples_per_second": 7.939,
|
780 |
"eval_steps_per_second": 0.516,
|
781 |
"step": 434
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
782 |
}
|
783 |
],
|
784 |
"logging_steps": 10,
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 1.7856,
|
5 |
"eval_steps": 62,
|
6 |
+
"global_step": 558,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
779 |
"eval_samples_per_second": 7.939,
|
780 |
"eval_steps_per_second": 0.516,
|
781 |
"step": 434
|
782 |
+
},
|
783 |
+
{
|
784 |
+
"epoch": 1.408,
|
785 |
+
"grad_norm": 16.14545407384991,
|
786 |
+
"learning_rate": 2.9453681710213776e-07,
|
787 |
+
"logits/generated": -0.9800319671630859,
|
788 |
+
"logits/real": -0.9277538061141968,
|
789 |
+
"logps/generated": -141.30862426757812,
|
790 |
+
"logps/real": -147.81869506835938,
|
791 |
+
"loss": 0.6465,
|
792 |
+
"rewards/accuracies": 0.762499988079071,
|
793 |
+
"rewards/generated": 3.95501971244812,
|
794 |
+
"rewards/margins": 0.6686196327209473,
|
795 |
+
"rewards/real": 4.6236395835876465,
|
796 |
+
"step": 440
|
797 |
+
},
|
798 |
+
{
|
799 |
+
"epoch": 1.44,
|
800 |
+
"grad_norm": 15.77508759846596,
|
801 |
+
"learning_rate": 2.885985748218527e-07,
|
802 |
+
"logits/generated": -1.066090703010559,
|
803 |
+
"logits/real": -0.9800545573234558,
|
804 |
+
"logps/generated": -118.1541748046875,
|
805 |
+
"logps/real": -114.2128677368164,
|
806 |
+
"loss": 0.6559,
|
807 |
+
"rewards/accuracies": 0.762499988079071,
|
808 |
+
"rewards/generated": 3.9932830333709717,
|
809 |
+
"rewards/margins": 0.5581256151199341,
|
810 |
+
"rewards/real": 4.5514092445373535,
|
811 |
+
"step": 450
|
812 |
+
},
|
813 |
+
{
|
814 |
+
"epoch": 1.472,
|
815 |
+
"grad_norm": 13.373472109654648,
|
816 |
+
"learning_rate": 2.8266033254156767e-07,
|
817 |
+
"logits/generated": -1.1050423383712769,
|
818 |
+
"logits/real": -1.059169888496399,
|
819 |
+
"logps/generated": -126.13043212890625,
|
820 |
+
"logps/real": -127.02229309082031,
|
821 |
+
"loss": 0.6429,
|
822 |
+
"rewards/accuracies": 0.7124999761581421,
|
823 |
+
"rewards/generated": 3.960355281829834,
|
824 |
+
"rewards/margins": 0.5283070206642151,
|
825 |
+
"rewards/real": 4.488662242889404,
|
826 |
+
"step": 460
|
827 |
+
},
|
828 |
+
{
|
829 |
+
"epoch": 1.504,
|
830 |
+
"grad_norm": 18.748026049573703,
|
831 |
+
"learning_rate": 2.7672209026128263e-07,
|
832 |
+
"logits/generated": -1.0380802154541016,
|
833 |
+
"logits/real": -1.0288408994674683,
|
834 |
+
"logps/generated": -124.66336822509766,
|
835 |
+
"logps/real": -129.6002197265625,
|
836 |
+
"loss": 0.631,
|
837 |
+
"rewards/accuracies": 0.762499988079071,
|
838 |
+
"rewards/generated": 4.066103458404541,
|
839 |
+
"rewards/margins": 0.5287829637527466,
|
840 |
+
"rewards/real": 4.59488582611084,
|
841 |
+
"step": 470
|
842 |
+
},
|
843 |
+
{
|
844 |
+
"epoch": 1.536,
|
845 |
+
"grad_norm": 18.771817584136546,
|
846 |
+
"learning_rate": 2.7078384798099764e-07,
|
847 |
+
"logits/generated": -1.030465841293335,
|
848 |
+
"logits/real": -1.0079973936080933,
|
849 |
+
"logps/generated": -110.46805572509766,
|
850 |
+
"logps/real": -130.38272094726562,
|
851 |
+
"loss": 0.6314,
|
852 |
+
"rewards/accuracies": 0.800000011920929,
|
853 |
+
"rewards/generated": 4.3078484535217285,
|
854 |
+
"rewards/margins": 0.575871467590332,
|
855 |
+
"rewards/real": 4.883719444274902,
|
856 |
+
"step": 480
|
857 |
+
},
|
858 |
+
{
|
859 |
+
"epoch": 1.568,
|
860 |
+
"grad_norm": 18.77488834205678,
|
861 |
+
"learning_rate": 2.648456057007126e-07,
|
862 |
+
"logits/generated": -1.0200045108795166,
|
863 |
+
"logits/real": -0.9613162875175476,
|
864 |
+
"logps/generated": -121.91667175292969,
|
865 |
+
"logps/real": -125.25045013427734,
|
866 |
+
"loss": 0.6575,
|
867 |
+
"rewards/accuracies": 0.800000011920929,
|
868 |
+
"rewards/generated": 4.19071626663208,
|
869 |
+
"rewards/margins": 0.5527010560035706,
|
870 |
+
"rewards/real": 4.743417263031006,
|
871 |
+
"step": 490
|
872 |
+
},
|
873 |
+
{
|
874 |
+
"epoch": 1.5872000000000002,
|
875 |
+
"eval_logits/generated": -1.0562151670455933,
|
876 |
+
"eval_logits/real": -0.9284681081771851,
|
877 |
+
"eval_logps/generated": -117.39347839355469,
|
878 |
+
"eval_logps/real": -131.05850219726562,
|
879 |
+
"eval_loss": 0.7352110147476196,
|
880 |
+
"eval_rewards/accuracies": 0.6538461446762085,
|
881 |
+
"eval_rewards/generated": 4.491795063018799,
|
882 |
+
"eval_rewards/margins": 0.3582780063152313,
|
883 |
+
"eval_rewards/real": 4.850072860717773,
|
884 |
+
"eval_runtime": 33.2476,
|
885 |
+
"eval_samples_per_second": 6.015,
|
886 |
+
"eval_steps_per_second": 0.391,
|
887 |
+
"step": 496
|
888 |
+
},
|
889 |
+
{
|
890 |
+
"epoch": 1.6,
|
891 |
+
"grad_norm": 16.35108797368165,
|
892 |
+
"learning_rate": 2.589073634204275e-07,
|
893 |
+
"logits/generated": -1.1007959842681885,
|
894 |
+
"logits/real": -1.0145621299743652,
|
895 |
+
"logps/generated": -118.1299057006836,
|
896 |
+
"logps/real": -132.48341369628906,
|
897 |
+
"loss": 0.6584,
|
898 |
+
"rewards/accuracies": 0.824999988079071,
|
899 |
+
"rewards/generated": 4.270500659942627,
|
900 |
+
"rewards/margins": 0.6508221626281738,
|
901 |
+
"rewards/real": 4.921322822570801,
|
902 |
+
"step": 500
|
903 |
+
},
|
904 |
+
{
|
905 |
+
"epoch": 1.6320000000000001,
|
906 |
+
"grad_norm": 18.24668534196415,
|
907 |
+
"learning_rate": 2.529691211401425e-07,
|
908 |
+
"logits/generated": -1.0347979068756104,
|
909 |
+
"logits/real": -1.0171585083007812,
|
910 |
+
"logps/generated": -134.5014190673828,
|
911 |
+
"logps/real": -128.9965362548828,
|
912 |
+
"loss": 0.6401,
|
913 |
+
"rewards/accuracies": 0.7749999761581421,
|
914 |
+
"rewards/generated": 4.300790309906006,
|
915 |
+
"rewards/margins": 0.6908756494522095,
|
916 |
+
"rewards/real": 4.991666316986084,
|
917 |
+
"step": 510
|
918 |
+
},
|
919 |
+
{
|
920 |
+
"epoch": 1.6640000000000001,
|
921 |
+
"grad_norm": 26.651414563625863,
|
922 |
+
"learning_rate": 2.4703087885985747e-07,
|
923 |
+
"logits/generated": -1.0487991571426392,
|
924 |
+
"logits/real": -0.9584493637084961,
|
925 |
+
"logps/generated": -112.0241928100586,
|
926 |
+
"logps/real": -135.36444091796875,
|
927 |
+
"loss": 0.6194,
|
928 |
+
"rewards/accuracies": 0.7749999761581421,
|
929 |
+
"rewards/generated": 4.406290531158447,
|
930 |
+
"rewards/margins": 0.6576591730117798,
|
931 |
+
"rewards/real": 5.0639495849609375,
|
932 |
+
"step": 520
|
933 |
+
},
|
934 |
+
{
|
935 |
+
"epoch": 1.696,
|
936 |
+
"grad_norm": 15.873503010462953,
|
937 |
+
"learning_rate": 2.410926365795724e-07,
|
938 |
+
"logits/generated": -1.0919219255447388,
|
939 |
+
"logits/real": -0.9894660115242004,
|
940 |
+
"logps/generated": -116.85237121582031,
|
941 |
+
"logps/real": -134.66482543945312,
|
942 |
+
"loss": 0.6307,
|
943 |
+
"rewards/accuracies": 0.7749999761581421,
|
944 |
+
"rewards/generated": 4.291749477386475,
|
945 |
+
"rewards/margins": 0.566550612449646,
|
946 |
+
"rewards/real": 4.85830020904541,
|
947 |
+
"step": 530
|
948 |
+
},
|
949 |
+
{
|
950 |
+
"epoch": 1.728,
|
951 |
+
"grad_norm": 18.65864238709199,
|
952 |
+
"learning_rate": 2.351543942992874e-07,
|
953 |
+
"logits/generated": -1.0818088054656982,
|
954 |
+
"logits/real": -1.0851285457611084,
|
955 |
+
"logps/generated": -121.41314697265625,
|
956 |
+
"logps/real": -126.65281677246094,
|
957 |
+
"loss": 0.6306,
|
958 |
+
"rewards/accuracies": 0.7749999761581421,
|
959 |
+
"rewards/generated": 4.241837978363037,
|
960 |
+
"rewards/margins": 0.7786606550216675,
|
961 |
+
"rewards/real": 5.020498752593994,
|
962 |
+
"step": 540
|
963 |
+
},
|
964 |
+
{
|
965 |
+
"epoch": 1.76,
|
966 |
+
"grad_norm": 16.985163916244147,
|
967 |
+
"learning_rate": 2.2921615201900234e-07,
|
968 |
+
"logits/generated": -1.0255613327026367,
|
969 |
+
"logits/real": -1.0782816410064697,
|
970 |
+
"logps/generated": -121.6998519897461,
|
971 |
+
"logps/real": -118.9133529663086,
|
972 |
+
"loss": 0.6606,
|
973 |
+
"rewards/accuracies": 0.6000000238418579,
|
974 |
+
"rewards/generated": 4.7306671142578125,
|
975 |
+
"rewards/margins": 0.3756607174873352,
|
976 |
+
"rewards/real": 5.106327533721924,
|
977 |
+
"step": 550
|
978 |
+
},
|
979 |
+
{
|
980 |
+
"epoch": 1.7856,
|
981 |
+
"eval_logits/generated": -1.0969022512435913,
|
982 |
+
"eval_logits/real": -0.9780063629150391,
|
983 |
+
"eval_logps/generated": -114.82669830322266,
|
984 |
+
"eval_logps/real": -128.44029235839844,
|
985 |
+
"eval_loss": 0.7269737720489502,
|
986 |
+
"eval_rewards/accuracies": 0.6538461446762085,
|
987 |
+
"eval_rewards/generated": 4.748473167419434,
|
988 |
+
"eval_rewards/margins": 0.36342188715934753,
|
989 |
+
"eval_rewards/real": 5.1118950843811035,
|
990 |
+
"eval_runtime": 25.1083,
|
991 |
+
"eval_samples_per_second": 7.965,
|
992 |
+
"eval_steps_per_second": 0.518,
|
993 |
+
"step": 558
|
994 |
}
|
995 |
],
|
996 |
"logging_steps": 10,
|