AmberYifan commited on
Commit
83ecac9
·
verified ·
1 Parent(s): 2517482

Training in progress, step 434, checkpoint

Browse files
last-checkpoint/global_step434/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d44d1d0c35af51487b3cd1bc18f6d735de17786eb0a9387a08df55aa918e062
3
+ size 13476835648
last-checkpoint/global_step434/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44ed82266ea6c62e3b2abeb15f6c726308f5858bd444d753435695d35af6b66d
3
+ size 13476835648
last-checkpoint/global_step434/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53438a552937f6ed18455d29745dfcbe301d674e0e05181f9f6fc92febe2c20d
3
+ size 13476835648
last-checkpoint/global_step434/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3ca81f745957762ea10705954cc29176be581d014eeb85848a6759c057d7611
3
+ size 13476835648
last-checkpoint/global_step434/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d602987ebf3bbae4f0a6d6b2015bd8e97c228dfcdff21db2dbe4a1394db07a8
3
+ size 150693
last-checkpoint/global_step434/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e424b63a80269c73a0353a46165784211ea81b0f904a22294880c6a6fb3ebfb5
3
+ size 150693
last-checkpoint/global_step434/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a0925e1e5e253ade9172f2400590391fb177d59d566ae875adab40cb4e467e3
3
+ size 150693
last-checkpoint/global_step434/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aacbe32e99222ebc853d9cf2162fb15cdb3156ad5ca97f518792b9c27a65d1d7
3
+ size 150693
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step310
 
1
+ global_step434
last-checkpoint/model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7629983c481eb9200b556ac83ed8d209475fc4ef48f27d568a5cb34179c3b672
3
  size 4938985352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a15bbb67da4b68beaed8d1f1dd43168748b208cf17aaf6f45a7686e7c1edbd9b
3
  size 4938985352
last-checkpoint/model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7708922bcf1e99c851124c87b0ec55e1c4b40e5c0cea43b42302293a17729487
3
  size 4947390880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83c88deee3881a332b37ac27498efc573e8a8ef204fcce2dd84ce5b85ecd6313
3
  size 4947390880
last-checkpoint/model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44492addf0ff01b4318cdfbe27b38d73decff5f3a716bd9a106eee463d36f582
3
  size 3590488816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb90a353cf0905ea79815177f94ace740d874bfb168850d0808801067ab6b160
3
  size 3590488816
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:85a44fde7a8ca235658f035c0812d344f55779640520411739b17e214177e846
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe3f96a2fff0ebd8dbcc2b4789c9dd47a218358381d8dc0c22453d73cc18c13a
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2caad91201b0df46e56af9eecef567ed2037350c38fdc81837724a4727d0b050
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03c2e37b3b994a43a2c3a96dca7647061b052e8930abe99d16ea118bb9a4e2bc
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:73e988587366c84fd1b4fc5931610543c6da84cf501cd98c78745fd102dd5024
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd2fb470636af306fe33bfa071a70c5e89bbc147a17ff3351e6d952861610b64
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:55af3bb04c01d99df727583b8b7a09241b4e47d58ff1b9cf5532d3fa0d878b52
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42f403a555728d319355f2901e7ccab38b27c2ffdef1825aa77e363c48d96a77
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:deebfd046c912c12a5ec3992f182a7898d0a095fd57e8891bf19ccf9e61ba445
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:765f176539e61f4c6bc8f2ad5d717ae2c3e0b0b105343abdeb194f4ded8a8b9b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.992,
5
  "eval_steps": 62,
6
- "global_step": 310,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -567,6 +567,218 @@
567
  "eval_samples_per_second": 8.068,
568
  "eval_steps_per_second": 0.524,
569
  "step": 310
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
570
  }
571
  ],
572
  "logging_steps": 10,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.3888,
5
  "eval_steps": 62,
6
+ "global_step": 434,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
567
  "eval_samples_per_second": 8.068,
568
  "eval_steps_per_second": 0.524,
569
  "step": 310
570
+ },
571
+ {
572
+ "epoch": 1.024,
573
+ "grad_norm": 0.39684443120667556,
574
+ "learning_rate": 3.6579572446555817e-07,
575
+ "logits/generated": -0.9057809710502625,
576
+ "logits/real": -1.3521413803100586,
577
+ "logps/generated": -349.14471435546875,
578
+ "logps/real": -111.87225341796875,
579
+ "loss": 0.1073,
580
+ "rewards/accuracies": 1.0,
581
+ "rewards/generated": -5.6079206466674805,
582
+ "rewards/margins": 15.645317077636719,
583
+ "rewards/real": 10.037394523620605,
584
+ "step": 320
585
+ },
586
+ {
587
+ "epoch": 1.056,
588
+ "grad_norm": 0.39872204323404287,
589
+ "learning_rate": 3.598574821852731e-07,
590
+ "logits/generated": -0.8963452577590942,
591
+ "logits/real": -1.4075753688812256,
592
+ "logps/generated": -350.3981018066406,
593
+ "logps/real": -111.39154052734375,
594
+ "loss": 0.1099,
595
+ "rewards/accuracies": 1.0,
596
+ "rewards/generated": -6.171029090881348,
597
+ "rewards/margins": 16.38304328918457,
598
+ "rewards/real": 10.212014198303223,
599
+ "step": 330
600
+ },
601
+ {
602
+ "epoch": 1.088,
603
+ "grad_norm": 0.3296521457207489,
604
+ "learning_rate": 3.5391923990498813e-07,
605
+ "logits/generated": -0.882519543170929,
606
+ "logits/real": -1.3683688640594482,
607
+ "logps/generated": -344.4193115234375,
608
+ "logps/real": -114.99576568603516,
609
+ "loss": 0.1121,
610
+ "rewards/accuracies": 1.0,
611
+ "rewards/generated": -6.464304447174072,
612
+ "rewards/margins": 16.844728469848633,
613
+ "rewards/real": 10.380424499511719,
614
+ "step": 340
615
+ },
616
+ {
617
+ "epoch": 1.12,
618
+ "grad_norm": 0.40794606558455315,
619
+ "learning_rate": 3.479809976247031e-07,
620
+ "logits/generated": -0.8548433184623718,
621
+ "logits/real": -1.33034086227417,
622
+ "logps/generated": -345.41497802734375,
623
+ "logps/real": -108.29139709472656,
624
+ "loss": 0.1084,
625
+ "rewards/accuracies": 1.0,
626
+ "rewards/generated": -5.70036506652832,
627
+ "rewards/margins": 15.80578899383545,
628
+ "rewards/real": 10.105424880981445,
629
+ "step": 350
630
+ },
631
+ {
632
+ "epoch": 1.152,
633
+ "grad_norm": 0.34179390042713315,
634
+ "learning_rate": 3.42042755344418e-07,
635
+ "logits/generated": -0.8854677081108093,
636
+ "logits/real": -1.3697372674942017,
637
+ "logps/generated": -349.7736511230469,
638
+ "logps/real": -117.81876373291016,
639
+ "loss": 0.1098,
640
+ "rewards/accuracies": 1.0,
641
+ "rewards/generated": -6.514307975769043,
642
+ "rewards/margins": 16.870037078857422,
643
+ "rewards/real": 10.355731010437012,
644
+ "step": 360
645
+ },
646
+ {
647
+ "epoch": 1.184,
648
+ "grad_norm": 0.38985325345599603,
649
+ "learning_rate": 3.36104513064133e-07,
650
+ "logits/generated": -0.8000022172927856,
651
+ "logits/real": -1.3874753713607788,
652
+ "logps/generated": -347.55010986328125,
653
+ "logps/real": -113.49405670166016,
654
+ "loss": 0.1046,
655
+ "rewards/accuracies": 1.0,
656
+ "rewards/generated": -6.464725494384766,
657
+ "rewards/margins": 16.653573989868164,
658
+ "rewards/real": 10.188849449157715,
659
+ "step": 370
660
+ },
661
+ {
662
+ "epoch": 1.1904,
663
+ "eval_logits/generated": -0.8655997514724731,
664
+ "eval_logits/real": -1.3632643222808838,
665
+ "eval_logps/generated": -349.3764953613281,
666
+ "eval_logps/real": -107.03945922851562,
667
+ "eval_loss": 0.10925532132387161,
668
+ "eval_rewards/accuracies": 1.0,
669
+ "eval_rewards/generated": -6.670737266540527,
670
+ "eval_rewards/margins": 16.652626037597656,
671
+ "eval_rewards/real": 9.981886863708496,
672
+ "eval_runtime": 35.169,
673
+ "eval_samples_per_second": 5.687,
674
+ "eval_steps_per_second": 0.37,
675
+ "step": 372
676
+ },
677
+ {
678
+ "epoch": 1.216,
679
+ "grad_norm": 0.3722532991523644,
680
+ "learning_rate": 3.3016627078384796e-07,
681
+ "logits/generated": -0.864538311958313,
682
+ "logits/real": -1.3105075359344482,
683
+ "logps/generated": -335.27362060546875,
684
+ "logps/real": -106.48799133300781,
685
+ "loss": 0.1035,
686
+ "rewards/accuracies": 1.0,
687
+ "rewards/generated": -6.397665977478027,
688
+ "rewards/margins": 16.154638290405273,
689
+ "rewards/real": 9.756973266601562,
690
+ "step": 380
691
+ },
692
+ {
693
+ "epoch": 1.248,
694
+ "grad_norm": 0.4038074067883792,
695
+ "learning_rate": 3.2422802850356297e-07,
696
+ "logits/generated": -0.8852449655532837,
697
+ "logits/real": -1.4460315704345703,
698
+ "logps/generated": -344.63311767578125,
699
+ "logps/real": -106.79902648925781,
700
+ "loss": 0.1027,
701
+ "rewards/accuracies": 1.0,
702
+ "rewards/generated": -5.748571395874023,
703
+ "rewards/margins": 15.521743774414062,
704
+ "rewards/real": 9.773170471191406,
705
+ "step": 390
706
+ },
707
+ {
708
+ "epoch": 1.28,
709
+ "grad_norm": 0.28676972353775737,
710
+ "learning_rate": 3.182897862232779e-07,
711
+ "logits/generated": -0.8121256828308105,
712
+ "logits/real": -1.354479432106018,
713
+ "logps/generated": -345.53326416015625,
714
+ "logps/real": -107.84037017822266,
715
+ "loss": 0.1003,
716
+ "rewards/accuracies": 1.0,
717
+ "rewards/generated": -6.011273384094238,
718
+ "rewards/margins": 15.705144882202148,
719
+ "rewards/real": 9.693869590759277,
720
+ "step": 400
721
+ },
722
+ {
723
+ "epoch": 1.312,
724
+ "grad_norm": 0.3326501083643602,
725
+ "learning_rate": 3.1235154394299283e-07,
726
+ "logits/generated": -0.8699803352355957,
727
+ "logits/real": -1.3926770687103271,
728
+ "logps/generated": -339.2923583984375,
729
+ "logps/real": -113.30909729003906,
730
+ "loss": 0.1069,
731
+ "rewards/accuracies": 1.0,
732
+ "rewards/generated": -5.364248275756836,
733
+ "rewards/margins": 15.17718505859375,
734
+ "rewards/real": 9.81293773651123,
735
+ "step": 410
736
+ },
737
+ {
738
+ "epoch": 1.3439999999999999,
739
+ "grad_norm": 0.41187476133988626,
740
+ "learning_rate": 3.0641330166270784e-07,
741
+ "logits/generated": -0.8451802134513855,
742
+ "logits/real": -1.3541207313537598,
743
+ "logps/generated": -344.1119384765625,
744
+ "logps/real": -99.13960266113281,
745
+ "loss": 0.103,
746
+ "rewards/accuracies": 1.0,
747
+ "rewards/generated": -6.0690155029296875,
748
+ "rewards/margins": 15.549135208129883,
749
+ "rewards/real": 9.480117797851562,
750
+ "step": 420
751
+ },
752
+ {
753
+ "epoch": 1.376,
754
+ "grad_norm": 0.37308896269833713,
755
+ "learning_rate": 3.004750593824228e-07,
756
+ "logits/generated": -0.8354321718215942,
757
+ "logits/real": -1.397528052330017,
758
+ "logps/generated": -354.12841796875,
759
+ "logps/real": -108.86185455322266,
760
+ "loss": 0.1067,
761
+ "rewards/accuracies": 1.0,
762
+ "rewards/generated": -6.957143306732178,
763
+ "rewards/margins": 16.80294418334961,
764
+ "rewards/real": 9.845802307128906,
765
+ "step": 430
766
+ },
767
+ {
768
+ "epoch": 1.3888,
769
+ "eval_logits/generated": -0.881392776966095,
770
+ "eval_logits/real": -1.3897513151168823,
771
+ "eval_logps/generated": -358.4093933105469,
772
+ "eval_logps/real": -106.73082733154297,
773
+ "eval_loss": 0.10892020910978317,
774
+ "eval_rewards/accuracies": 1.0,
775
+ "eval_rewards/generated": -7.574033260345459,
776
+ "eval_rewards/margins": 17.586782455444336,
777
+ "eval_rewards/real": 10.012747764587402,
778
+ "eval_runtime": 25.6933,
779
+ "eval_samples_per_second": 7.784,
780
+ "eval_steps_per_second": 0.506,
781
+ "step": 434
782
  }
783
  ],
784
  "logging_steps": 10,