AmberYifan commited on
Commit
6c81e27
·
verified ·
1 Parent(s): 7740585

Training in progress, step 310, checkpoint

Browse files
last-checkpoint/global_step310/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:548d0c8e93e0c471e5705dbbadd6a5c05bc4b5a0a9f6890bd5dd4cd8c443c33a
3
+ size 13476835648
last-checkpoint/global_step310/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fcf81f7763d28c21ac0a035c3f8910a9c68675635c88ba8e8fda0b8a22ab2d0
3
+ size 13476835648
last-checkpoint/global_step310/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ac9a85e921ce7b9ed72c131038ff1bb0c9e833d8c9640b2e5a83cb2164b5366
3
+ size 13476835648
last-checkpoint/global_step310/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a48b112b82d265c4a90ebd28aff54857341852a8d8e779aeb35b75ae4313c39a
3
+ size 13476835648
last-checkpoint/global_step310/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dfaccb97630865bfa96a9f8fc8e1eaac2f641bb5486f7f1b34ba82548d9a217
3
+ size 150693
last-checkpoint/global_step310/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c296a38893fbec54c8fb4c320b4ea180b982277ef291f058b5ffca0caf27bd2
3
+ size 150693
last-checkpoint/global_step310/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a19de9850756f925991116920eef332af9868426f05cf741786bffa261e1b51
3
+ size 150693
last-checkpoint/global_step310/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b775b848751a6b5c74313b60cd24e3e2d525b738411897a1a952fc106bb1799
3
+ size 150693
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step186
 
1
+ global_step310
last-checkpoint/model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81392ca1341eff0062e670bf6bae66fb987670c5ea66d248165e16d5b2550583
3
  size 4938985352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30a7e1affffdf9c15def3843c5cfde483a104628598dfecba30ed1049b0a30c5
3
  size 4938985352
last-checkpoint/model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1006a496ee196194e313e59321565ad7eb47f0dda4e314fd48d34709bd92ff82
3
  size 4947390880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3c9d98753585457974806fe841e26db43d8bfe281fc8e6d20c96594f83a2b8b
3
  size 4947390880
last-checkpoint/model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01d6dfe355522d2cd855421ed2ca07b299127e352ea22630b44c2a31747bb37c
3
  size 3590488816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:befe572e3ac32569b9d5d967b2c53d5c3a8e605e513126ccf8bfe7f95b20b4cd
3
  size 3590488816
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:50ca27603f7c4a4d9a980223e1a102922ac31561acfa7da4f28042e4e8b3528b
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85a44fde7a8ca235658f035c0812d344f55779640520411739b17e214177e846
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c57f658c3d9b6de611da50021823095fc4067036fb9a4b34655cc2e34fbf5c2b
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2caad91201b0df46e56af9eecef567ed2037350c38fdc81837724a4727d0b050
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:109da2c363a1e09432fa2ea2b7dceb6f67d1f91975069fc669e71dd536d654d8
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73e988587366c84fd1b4fc5931610543c6da84cf501cd98c78745fd102dd5024
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bda65e490958bfe3fe01157ed131eb2354f8fc19536842d27c998ecf29d48991
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55af3bb04c01d99df727583b8b7a09241b4e47d58ff1b9cf5532d3fa0d878b52
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4f13df3470221c87dbd73f49aa8200fcb840f387f1d9666c0df7b34d2fa99d1
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:deebfd046c912c12a5ec3992f182a7898d0a095fd57e8891bf19ccf9e61ba445
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.5952,
5
  "eval_steps": 62,
6
- "global_step": 186,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -340,6 +340,233 @@
340
  "eval_samples_per_second": 8.273,
341
  "eval_steps_per_second": 0.538,
342
  "step": 186
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
343
  }
344
  ],
345
  "logging_steps": 10,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.992,
5
  "eval_steps": 62,
6
+ "global_step": 310,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
340
  "eval_samples_per_second": 8.273,
341
  "eval_steps_per_second": 0.538,
342
  "step": 186
343
+ },
344
+ {
345
+ "epoch": 0.608,
346
+ "grad_norm": 16.658908982743004,
347
+ "learning_rate": 4.429928741092636e-07,
348
+ "logits/generated": -0.8416504859924316,
349
+ "logits/real": -0.7497158646583557,
350
+ "logps/generated": -139.05709838867188,
351
+ "logps/real": -148.94570922851562,
352
+ "loss": 0.7846,
353
+ "rewards/accuracies": 0.5874999761581421,
354
+ "rewards/generated": 2.1404006481170654,
355
+ "rewards/margins": 0.2006792575120926,
356
+ "rewards/real": 2.3410801887512207,
357
+ "step": 190
358
+ },
359
+ {
360
+ "epoch": 0.64,
361
+ "grad_norm": 18.49294211550667,
362
+ "learning_rate": 4.3705463182897863e-07,
363
+ "logits/generated": -0.8149245381355286,
364
+ "logits/real": -0.7733741402626038,
365
+ "logps/generated": -148.7723388671875,
366
+ "logps/real": -157.01002502441406,
367
+ "loss": 0.8195,
368
+ "rewards/accuracies": 0.6000000238418579,
369
+ "rewards/generated": 2.387281894683838,
370
+ "rewards/margins": 0.09757533669471741,
371
+ "rewards/real": 2.4848568439483643,
372
+ "step": 200
373
+ },
374
+ {
375
+ "epoch": 0.672,
376
+ "grad_norm": 17.59332234236512,
377
+ "learning_rate": 4.311163895486936e-07,
378
+ "logits/generated": -0.9455936551094055,
379
+ "logits/real": -0.8419392704963684,
380
+ "logps/generated": -127.24183654785156,
381
+ "logps/real": -152.42926025390625,
382
+ "loss": 0.8053,
383
+ "rewards/accuracies": 0.7250000238418579,
384
+ "rewards/generated": 2.3595032691955566,
385
+ "rewards/margins": 0.2850414216518402,
386
+ "rewards/real": 2.6445446014404297,
387
+ "step": 210
388
+ },
389
+ {
390
+ "epoch": 0.704,
391
+ "grad_norm": 19.24367698573702,
392
+ "learning_rate": 4.251781472684085e-07,
393
+ "logits/generated": -0.9183988571166992,
394
+ "logits/real": -0.8173867464065552,
395
+ "logps/generated": -139.09605407714844,
396
+ "logps/real": -148.06333923339844,
397
+ "loss": 0.7934,
398
+ "rewards/accuracies": 0.625,
399
+ "rewards/generated": 2.477370500564575,
400
+ "rewards/margins": 0.19253475964069366,
401
+ "rewards/real": 2.669905185699463,
402
+ "step": 220
403
+ },
404
+ {
405
+ "epoch": 0.736,
406
+ "grad_norm": 16.9276097355701,
407
+ "learning_rate": 4.192399049881235e-07,
408
+ "logits/generated": -0.8829792737960815,
409
+ "logits/real": -0.7381778955459595,
410
+ "logps/generated": -141.7750701904297,
411
+ "logps/real": -163.01681518554688,
412
+ "loss": 0.7719,
413
+ "rewards/accuracies": 0.675000011920929,
414
+ "rewards/generated": 2.4790730476379395,
415
+ "rewards/margins": 0.2519153952598572,
416
+ "rewards/real": 2.730988025665283,
417
+ "step": 230
418
+ },
419
+ {
420
+ "epoch": 0.768,
421
+ "grad_norm": 17.716708290599904,
422
+ "learning_rate": 4.1330166270783846e-07,
423
+ "logits/generated": -0.971518874168396,
424
+ "logits/real": -0.8174247741699219,
425
+ "logps/generated": -133.48629760742188,
426
+ "logps/real": -155.50323486328125,
427
+ "loss": 0.7916,
428
+ "rewards/accuracies": 0.7124999761581421,
429
+ "rewards/generated": 2.6949586868286133,
430
+ "rewards/margins": 0.36087772250175476,
431
+ "rewards/real": 3.0558362007141113,
432
+ "step": 240
433
+ },
434
+ {
435
+ "epoch": 0.7936,
436
+ "eval_logits/generated": -0.9049049615859985,
437
+ "eval_logits/real": -0.7322394847869873,
438
+ "eval_logps/generated": -133.84751892089844,
439
+ "eval_logps/real": -149.44224548339844,
440
+ "eval_loss": 0.7819451689720154,
441
+ "eval_rewards/accuracies": 0.6346153616905212,
442
+ "eval_rewards/generated": 2.8463921546936035,
443
+ "eval_rewards/margins": 0.1653067171573639,
444
+ "eval_rewards/real": 3.0116991996765137,
445
+ "eval_runtime": 32.5126,
446
+ "eval_samples_per_second": 6.151,
447
+ "eval_steps_per_second": 0.4,
448
+ "step": 248
449
+ },
450
+ {
451
+ "epoch": 0.8,
452
+ "grad_norm": 18.640457628639687,
453
+ "learning_rate": 4.0736342042755347e-07,
454
+ "logits/generated": -0.9556293487548828,
455
+ "logits/real": -0.8145408630371094,
456
+ "logps/generated": -131.24642944335938,
457
+ "logps/real": -151.69544982910156,
458
+ "loss": 0.7887,
459
+ "rewards/accuracies": 0.637499988079071,
460
+ "rewards/generated": 2.6524691581726074,
461
+ "rewards/margins": 0.29434913396835327,
462
+ "rewards/real": 2.9468178749084473,
463
+ "step": 250
464
+ },
465
+ {
466
+ "epoch": 0.832,
467
+ "grad_norm": 16.63118310118808,
468
+ "learning_rate": 4.0142517814726837e-07,
469
+ "logits/generated": -0.9603360891342163,
470
+ "logits/real": -0.8654125332832336,
471
+ "logps/generated": -131.46536254882812,
472
+ "logps/real": -145.35955810546875,
473
+ "loss": 0.745,
474
+ "rewards/accuracies": 0.75,
475
+ "rewards/generated": 2.698146343231201,
476
+ "rewards/margins": 0.3590725362300873,
477
+ "rewards/real": 3.0572190284729004,
478
+ "step": 260
479
+ },
480
+ {
481
+ "epoch": 0.864,
482
+ "grad_norm": 17.928869855327637,
483
+ "learning_rate": 3.9548693586698333e-07,
484
+ "logits/generated": -0.8567088842391968,
485
+ "logits/real": -0.8730006217956543,
486
+ "logps/generated": -141.62771606445312,
487
+ "logps/real": -148.68130493164062,
488
+ "loss": 0.7724,
489
+ "rewards/accuracies": 0.7124999761581421,
490
+ "rewards/generated": 2.8369460105895996,
491
+ "rewards/margins": 0.2711881995201111,
492
+ "rewards/real": 3.1081342697143555,
493
+ "step": 270
494
+ },
495
+ {
496
+ "epoch": 0.896,
497
+ "grad_norm": 20.71939027600533,
498
+ "learning_rate": 3.8954869358669834e-07,
499
+ "logits/generated": -0.9359349012374878,
500
+ "logits/real": -0.8951263427734375,
501
+ "logps/generated": -130.23509216308594,
502
+ "logps/real": -145.52688598632812,
503
+ "loss": 0.753,
504
+ "rewards/accuracies": 0.699999988079071,
505
+ "rewards/generated": 2.9565887451171875,
506
+ "rewards/margins": 0.2209053933620453,
507
+ "rewards/real": 3.1774942874908447,
508
+ "step": 280
509
+ },
510
+ {
511
+ "epoch": 0.928,
512
+ "grad_norm": 18.70808890126872,
513
+ "learning_rate": 3.836104513064133e-07,
514
+ "logits/generated": -0.9469617009162903,
515
+ "logits/real": -0.8130922317504883,
516
+ "logps/generated": -139.7478485107422,
517
+ "logps/real": -161.3312530517578,
518
+ "loss": 0.7894,
519
+ "rewards/accuracies": 0.675000011920929,
520
+ "rewards/generated": 3.0255463123321533,
521
+ "rewards/margins": 0.2867078185081482,
522
+ "rewards/real": 3.3122544288635254,
523
+ "step": 290
524
+ },
525
+ {
526
+ "epoch": 0.96,
527
+ "grad_norm": 17.486386337096317,
528
+ "learning_rate": 3.7767220902612825e-07,
529
+ "logits/generated": -1.0176459550857544,
530
+ "logits/real": -0.9189609289169312,
531
+ "logps/generated": -118.82048034667969,
532
+ "logps/real": -129.76571655273438,
533
+ "loss": 0.776,
534
+ "rewards/accuracies": 0.6499999761581421,
535
+ "rewards/generated": 3.0009846687316895,
536
+ "rewards/margins": 0.2632009983062744,
537
+ "rewards/real": 3.2641854286193848,
538
+ "step": 300
539
+ },
540
+ {
541
+ "epoch": 0.992,
542
+ "grad_norm": 19.447896698095892,
543
+ "learning_rate": 3.717339667458432e-07,
544
+ "logits/generated": -1.0006765127182007,
545
+ "logits/real": -0.8371036648750305,
546
+ "logps/generated": -124.53524017333984,
547
+ "logps/real": -153.3790740966797,
548
+ "loss": 0.7714,
549
+ "rewards/accuracies": 0.7250000238418579,
550
+ "rewards/generated": 3.1662862300872803,
551
+ "rewards/margins": 0.36638301610946655,
552
+ "rewards/real": 3.5326695442199707,
553
+ "step": 310
554
+ },
555
+ {
556
+ "epoch": 0.992,
557
+ "eval_logits/generated": -0.9510602951049805,
558
+ "eval_logits/real": -0.7904863357543945,
559
+ "eval_logps/generated": -130.37039184570312,
560
+ "eval_logps/real": -145.3455047607422,
561
+ "eval_loss": 0.7629792094230652,
562
+ "eval_rewards/accuracies": 0.6346153616905212,
563
+ "eval_rewards/generated": 3.1941020488739014,
564
+ "eval_rewards/margins": 0.2272697240114212,
565
+ "eval_rewards/real": 3.4213719367980957,
566
+ "eval_runtime": 24.7368,
567
+ "eval_samples_per_second": 8.085,
568
+ "eval_steps_per_second": 0.526,
569
+ "step": 310
570
  }
571
  ],
572
  "logging_steps": 10,