AmberYifan commited on
Commit
1b6dd37
·
verified ·
1 Parent(s): 2bb2f92

Training in progress, step 682, checkpoint

Browse files
last-checkpoint/global_step682/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55f80e5ca4498a6afacf85917035d3dcc988f53b9feaabf778663aaccba6b721
3
+ size 13476835648
last-checkpoint/global_step682/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:443b40db32a9df9b8c04466ea32d23d3cd59cad3c3da46a5e43eb344b62d2663
3
+ size 13476835648
last-checkpoint/global_step682/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcab7beaccb2feaf666d5402a4654edd9638e9ff92675a724f9d117b70311711
3
+ size 13476835648
last-checkpoint/global_step682/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6cc330bd15d21cb4221f72aa24a69ad46e2caeed9d63481ebfb29145a2c4258
3
+ size 13476835648
last-checkpoint/global_step682/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5302e9f937abbdc558c1157c893863879a77d337dca79ef76dceb8aaa281769b
3
+ size 150693
last-checkpoint/global_step682/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:937de52210755d6f3f9a3465565f7a01685102749fbda3c0f183fd3a4833b14a
3
+ size 150693
last-checkpoint/global_step682/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8bd21fa8d9e5187765f0c614f77fb6ace6c3376c82b76ac9267bd63c2474011
3
+ size 150693
last-checkpoint/global_step682/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ee275be2f3515a14f6a8f95fa623c837a903f6a7c93edbd62bc7924fc37d264
3
+ size 150693
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step558
 
1
+ global_step682
last-checkpoint/model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2eccfa1140badd2ba7d268833cb25515f4786a3a376ec7a70189454ca431a110
3
  size 4938985352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a978966c84c5073af91b7b63fcf4ee120d2f612a3c19702ad91cee54a444f1d
3
  size 4938985352
last-checkpoint/model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:afe95f19ba0b1d4f787647f396ad33e86582154ac38970507e3c4115ffd80235
3
  size 4947390880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:574fa029b596f19edcc30cc62efa2256b512251146943e1707cd1c2e84f45654
3
  size 4947390880
last-checkpoint/model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df33b2ae5733ef2380bc3366fb815ee4c3945810dd8a329f5963184b58b41341
3
  size 3590488816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebfde8270b886bb919881b07ed48cb5f4211146e60b32c2f6e09b8a7659d326a
3
  size 3590488816
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb3d4793d6c7fda650513b6f3d24fe7afd643475a576b0104a85cb659ed441d3
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4cf818939bfcb1de93c78e79be7390fcae46bb5c39166bd571b1f3a8b2cdeb3
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e44567105884943a8351ea71e9a71011cceee34a8f2a067be69948ea21390f49
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:408ca302fdad670605f637bd7faeea541858831c4f2318e3fca2d0d709c7b218
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8c3a6f11c1c82a313f717b58d29d20267d0bfc621c79116ac6f752e0c1ba1f50
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df380dcd2c8305fefe9f4ba88e7536beb3b5e94d863ac6f29eae326ddfef0f32
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aaa97839e10563397740560600a86ccaf5a6fe1e5f41084453cab0f732a05570
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51f78c929d775d81c8dd9feb87fd329a39e895b5f8b1d2cdbede2cbd8b45f49e
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:177a5448d699047d35d72636914adc373df5f511600959de3a1ed1ce15a52556
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ec08ea6383804e8c05c7ff772c4aed53351dc10413de8f46c3a1998585e65c7
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.7856,
5
  "eval_steps": 62,
6
- "global_step": 558,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -991,6 +991,233 @@
991
  "eval_samples_per_second": 7.965,
992
  "eval_steps_per_second": 0.518,
993
  "step": 558
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
994
  }
995
  ],
996
  "logging_steps": 10,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.1824,
5
  "eval_steps": 62,
6
+ "global_step": 682,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
991
  "eval_samples_per_second": 7.965,
992
  "eval_steps_per_second": 0.518,
993
  "step": 558
994
+ },
995
+ {
996
+ "epoch": 1.792,
997
+ "grad_norm": 17.055206574176236,
998
+ "learning_rate": 2.2327790973871732e-07,
999
+ "logits/generated": -1.1320490837097168,
1000
+ "logits/real": -1.0232712030410767,
1001
+ "logps/generated": -108.29972839355469,
1002
+ "logps/real": -143.79483032226562,
1003
+ "loss": 0.6217,
1004
+ "rewards/accuracies": 0.7749999761581421,
1005
+ "rewards/generated": 4.6177520751953125,
1006
+ "rewards/margins": 0.7333224415779114,
1007
+ "rewards/real": 5.351074695587158,
1008
+ "step": 560
1009
+ },
1010
+ {
1011
+ "epoch": 1.8239999999999998,
1012
+ "grad_norm": 18.75593177030039,
1013
+ "learning_rate": 2.173396674584323e-07,
1014
+ "logits/generated": -1.0942531824111938,
1015
+ "logits/real": -1.0221080780029297,
1016
+ "logps/generated": -126.5128173828125,
1017
+ "logps/real": -147.83128356933594,
1018
+ "loss": 0.628,
1019
+ "rewards/accuracies": 0.75,
1020
+ "rewards/generated": 4.6154656410217285,
1021
+ "rewards/margins": 0.5910970568656921,
1022
+ "rewards/real": 5.206562042236328,
1023
+ "step": 570
1024
+ },
1025
+ {
1026
+ "epoch": 1.8559999999999999,
1027
+ "grad_norm": 15.179698342246535,
1028
+ "learning_rate": 2.1140142517814726e-07,
1029
+ "logits/generated": -1.145850419998169,
1030
+ "logits/real": -1.0870602130889893,
1031
+ "logps/generated": -124.73545837402344,
1032
+ "logps/real": -121.8907241821289,
1033
+ "loss": 0.613,
1034
+ "rewards/accuracies": 0.824999988079071,
1035
+ "rewards/generated": 4.415905952453613,
1036
+ "rewards/margins": 0.7593585252761841,
1037
+ "rewards/real": 5.17526388168335,
1038
+ "step": 580
1039
+ },
1040
+ {
1041
+ "epoch": 1.888,
1042
+ "grad_norm": 20.11987923040954,
1043
+ "learning_rate": 2.0546318289786222e-07,
1044
+ "logits/generated": -1.079153060913086,
1045
+ "logits/real": -1.0978190898895264,
1046
+ "logps/generated": -120.56886291503906,
1047
+ "logps/real": -108.95628356933594,
1048
+ "loss": 0.6076,
1049
+ "rewards/accuracies": 0.75,
1050
+ "rewards/generated": 4.58314323425293,
1051
+ "rewards/margins": 0.6490724086761475,
1052
+ "rewards/real": 5.232215404510498,
1053
+ "step": 590
1054
+ },
1055
+ {
1056
+ "epoch": 1.92,
1057
+ "grad_norm": 22.28453291915191,
1058
+ "learning_rate": 1.9952494061757718e-07,
1059
+ "logits/generated": -1.0883268117904663,
1060
+ "logits/real": -1.0104598999023438,
1061
+ "logps/generated": -109.8032455444336,
1062
+ "logps/real": -129.53585815429688,
1063
+ "loss": 0.639,
1064
+ "rewards/accuracies": 0.8500000238418579,
1065
+ "rewards/generated": 4.67579460144043,
1066
+ "rewards/margins": 0.6613373160362244,
1067
+ "rewards/real": 5.337131977081299,
1068
+ "step": 600
1069
+ },
1070
+ {
1071
+ "epoch": 1.952,
1072
+ "grad_norm": 18.154894899648834,
1073
+ "learning_rate": 1.9358669833729216e-07,
1074
+ "logits/generated": -1.0883982181549072,
1075
+ "logits/real": -0.9995349049568176,
1076
+ "logps/generated": -124.6942367553711,
1077
+ "logps/real": -126.9339370727539,
1078
+ "loss": 0.5907,
1079
+ "rewards/accuracies": 0.824999988079071,
1080
+ "rewards/generated": 4.436325550079346,
1081
+ "rewards/margins": 0.8260261416435242,
1082
+ "rewards/real": 5.262351036071777,
1083
+ "step": 610
1084
+ },
1085
+ {
1086
+ "epoch": 1.984,
1087
+ "grad_norm": 22.624222827430785,
1088
+ "learning_rate": 1.876484560570071e-07,
1089
+ "logits/generated": -1.1425296068191528,
1090
+ "logits/real": -1.0683505535125732,
1091
+ "logps/generated": -115.10726165771484,
1092
+ "logps/real": -122.61649322509766,
1093
+ "loss": 0.6319,
1094
+ "rewards/accuracies": 0.8500000238418579,
1095
+ "rewards/generated": 4.4069294929504395,
1096
+ "rewards/margins": 0.796606183052063,
1097
+ "rewards/real": 5.203535556793213,
1098
+ "step": 620
1099
+ },
1100
+ {
1101
+ "epoch": 1.984,
1102
+ "eval_logits/generated": -1.0952835083007812,
1103
+ "eval_logits/real": -0.9814900159835815,
1104
+ "eval_logps/generated": -113.74794006347656,
1105
+ "eval_logps/real": -126.97822570800781,
1106
+ "eval_loss": 0.7260343432426453,
1107
+ "eval_rewards/accuracies": 0.6538461446762085,
1108
+ "eval_rewards/generated": 4.856348037719727,
1109
+ "eval_rewards/margins": 0.40175163745880127,
1110
+ "eval_rewards/real": 5.258099555969238,
1111
+ "eval_runtime": 31.4663,
1112
+ "eval_samples_per_second": 6.356,
1113
+ "eval_steps_per_second": 0.413,
1114
+ "step": 620
1115
+ },
1116
+ {
1117
+ "epoch": 2.016,
1118
+ "grad_norm": 21.8297742721762,
1119
+ "learning_rate": 1.8171021377672207e-07,
1120
+ "logits/generated": -1.0807393789291382,
1121
+ "logits/real": -1.0395593643188477,
1122
+ "logps/generated": -123.9543228149414,
1123
+ "logps/real": -131.9915771484375,
1124
+ "loss": 0.6155,
1125
+ "rewards/accuracies": 0.737500011920929,
1126
+ "rewards/generated": 4.8203253746032715,
1127
+ "rewards/margins": 0.5333833694458008,
1128
+ "rewards/real": 5.353708267211914,
1129
+ "step": 630
1130
+ },
1131
+ {
1132
+ "epoch": 2.048,
1133
+ "grad_norm": 14.056807307298643,
1134
+ "learning_rate": 1.7577197149643706e-07,
1135
+ "logits/generated": -1.1339702606201172,
1136
+ "logits/real": -1.0805795192718506,
1137
+ "logps/generated": -113.33274841308594,
1138
+ "logps/real": -121.1234130859375,
1139
+ "loss": 0.5439,
1140
+ "rewards/accuracies": 0.7875000238418579,
1141
+ "rewards/generated": 4.565612316131592,
1142
+ "rewards/margins": 0.6994994878768921,
1143
+ "rewards/real": 5.265111923217773,
1144
+ "step": 640
1145
+ },
1146
+ {
1147
+ "epoch": 2.08,
1148
+ "grad_norm": 15.940128910395343,
1149
+ "learning_rate": 1.6983372921615202e-07,
1150
+ "logits/generated": -1.0800470113754272,
1151
+ "logits/real": -1.0633183717727661,
1152
+ "logps/generated": -126.89707946777344,
1153
+ "logps/real": -120.8414535522461,
1154
+ "loss": 0.5551,
1155
+ "rewards/accuracies": 0.862500011920929,
1156
+ "rewards/generated": 4.451112270355225,
1157
+ "rewards/margins": 0.9589512944221497,
1158
+ "rewards/real": 5.410063743591309,
1159
+ "step": 650
1160
+ },
1161
+ {
1162
+ "epoch": 2.112,
1163
+ "grad_norm": 16.37087659914088,
1164
+ "learning_rate": 1.6389548693586697e-07,
1165
+ "logits/generated": -1.104059100151062,
1166
+ "logits/real": -1.0841295719146729,
1167
+ "logps/generated": -122.7937240600586,
1168
+ "logps/real": -123.018310546875,
1169
+ "loss": 0.5626,
1170
+ "rewards/accuracies": 0.824999988079071,
1171
+ "rewards/generated": 4.682831764221191,
1172
+ "rewards/margins": 0.842903733253479,
1173
+ "rewards/real": 5.525734901428223,
1174
+ "step": 660
1175
+ },
1176
+ {
1177
+ "epoch": 2.144,
1178
+ "grad_norm": 15.627941589708502,
1179
+ "learning_rate": 1.5795724465558193e-07,
1180
+ "logits/generated": -1.115173101425171,
1181
+ "logits/real": -1.003942847251892,
1182
+ "logps/generated": -110.61991119384766,
1183
+ "logps/real": -134.18214416503906,
1184
+ "loss": 0.5613,
1185
+ "rewards/accuracies": 0.824999988079071,
1186
+ "rewards/generated": 4.422333717346191,
1187
+ "rewards/margins": 0.9263809323310852,
1188
+ "rewards/real": 5.348714351654053,
1189
+ "step": 670
1190
+ },
1191
+ {
1192
+ "epoch": 2.176,
1193
+ "grad_norm": 14.69563602095957,
1194
+ "learning_rate": 1.520190023752969e-07,
1195
+ "logits/generated": -1.0999215841293335,
1196
+ "logits/real": -1.0661911964416504,
1197
+ "logps/generated": -117.02237701416016,
1198
+ "logps/real": -120.48469543457031,
1199
+ "loss": 0.552,
1200
+ "rewards/accuracies": 0.875,
1201
+ "rewards/generated": 4.575113773345947,
1202
+ "rewards/margins": 0.8418020009994507,
1203
+ "rewards/real": 5.416914939880371,
1204
+ "step": 680
1205
+ },
1206
+ {
1207
+ "epoch": 2.1824,
1208
+ "eval_logits/generated": -1.1133226156234741,
1209
+ "eval_logits/real": -1.007174015045166,
1210
+ "eval_logps/generated": -112.93437957763672,
1211
+ "eval_logps/real": -126.08976745605469,
1212
+ "eval_loss": 0.7294743061065674,
1213
+ "eval_rewards/accuracies": 0.6730769276618958,
1214
+ "eval_rewards/generated": 4.937705039978027,
1215
+ "eval_rewards/margins": 0.40924108028411865,
1216
+ "eval_rewards/real": 5.346945762634277,
1217
+ "eval_runtime": 31.1538,
1218
+ "eval_samples_per_second": 6.42,
1219
+ "eval_steps_per_second": 0.417,
1220
+ "step": 682
1221
  }
1222
  ],
1223
  "logging_steps": 10,