AmberYifan commited on
Commit
e511e34
·
verified ·
1 Parent(s): 69c533f

Training in progress, step 558, checkpoint

Browse files
last-checkpoint/global_step558/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b677f36c4dbba1597865689e743500347cf501cc6219466ae215b6987e26c4a
3
+ size 13476835648
last-checkpoint/global_step558/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fd0ebda0c87e79dc3722e97a2df83ca342944de2a92d4bc676479aecc3b820d
3
+ size 13476835648
last-checkpoint/global_step558/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f9907c8908adefd6616ebf28806c3565f695ec1ecb08061a9d4d09788bf909d
3
+ size 13476835648
last-checkpoint/global_step558/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5f08ee6a4a2fed19229106f2679c8a3cb7920a4ac82776a9eb8c61e74ef154a
3
+ size 13476835648
last-checkpoint/global_step558/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4197fab2e1b6c27eb80b4a12b9a89a88edef0d3b3bc4098bec66af56ce12175
3
+ size 150693
last-checkpoint/global_step558/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78b498011d22d6099b99f0e237cd72ed3cc9140d37841de3cb31cf16841ffd25
3
+ size 150693
last-checkpoint/global_step558/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f4e0cdbc12c565dcf5572f41f7bcd3101a01a4f373e5c67c204ba7126453f93
3
+ size 150693
last-checkpoint/global_step558/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:305d0a1a20b6d3b7dde4970a8b61cc22630f0e88cc5cba0ed422e6061840955a
3
+ size 150693
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step434
 
1
+ global_step558
last-checkpoint/model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a15bbb67da4b68beaed8d1f1dd43168748b208cf17aaf6f45a7686e7c1edbd9b
3
  size 4938985352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f57988b40ea7809dc08638e5caf7cc644808696ba431653d54751fa8e2ee7bef
3
  size 4938985352
last-checkpoint/model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83c88deee3881a332b37ac27498efc573e8a8ef204fcce2dd84ce5b85ecd6313
3
  size 4947390880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9637b70c600dc8d9de7c223cc42a2f547cec4117ec96d7971ad9596f125f6d4b
3
  size 4947390880
last-checkpoint/model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb90a353cf0905ea79815177f94ace740d874bfb168850d0808801067ab6b160
3
  size 3590488816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57ab4e25910ea5f9e07b0b0aa8590e1bbbeec9b69fd598de221f66b43383d7c9
3
  size 3590488816
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fe3f96a2fff0ebd8dbcc2b4789c9dd47a218358381d8dc0c22453d73cc18c13a
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb3d4793d6c7fda650513b6f3d24fe7afd643475a576b0104a85cb659ed441d3
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:03c2e37b3b994a43a2c3a96dca7647061b052e8930abe99d16ea118bb9a4e2bc
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e44567105884943a8351ea71e9a71011cceee34a8f2a067be69948ea21390f49
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd2fb470636af306fe33bfa071a70c5e89bbc147a17ff3351e6d952861610b64
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c3a6f11c1c82a313f717b58d29d20267d0bfc621c79116ac6f752e0c1ba1f50
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:42f403a555728d319355f2901e7ccab38b27c2ffdef1825aa77e363c48d96a77
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaa97839e10563397740560600a86ccaf5a6fe1e5f41084453cab0f732a05570
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:765f176539e61f4c6bc8f2ad5d717ae2c3e0b0b105343abdeb194f4ded8a8b9b
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:177a5448d699047d35d72636914adc373df5f511600959de3a1ed1ce15a52556
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.3888,
5
  "eval_steps": 62,
6
- "global_step": 434,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -779,6 +779,218 @@
779
  "eval_samples_per_second": 7.784,
780
  "eval_steps_per_second": 0.506,
781
  "step": 434
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
782
  }
783
  ],
784
  "logging_steps": 10,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.7856,
5
  "eval_steps": 62,
6
+ "global_step": 558,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
779
  "eval_samples_per_second": 7.784,
780
  "eval_steps_per_second": 0.506,
781
  "step": 434
782
+ },
783
+ {
784
+ "epoch": 1.408,
785
+ "grad_norm": 0.35037689567096764,
786
+ "learning_rate": 2.9453681710213776e-07,
787
+ "logits/generated": -0.8212960362434387,
788
+ "logits/real": -1.3137534856796265,
789
+ "logps/generated": -355.6631774902344,
790
+ "logps/real": -114.98287200927734,
791
+ "loss": 0.1095,
792
+ "rewards/accuracies": 1.0,
793
+ "rewards/generated": -6.6356201171875,
794
+ "rewards/margins": 16.64114761352539,
795
+ "rewards/real": 10.00552749633789,
796
+ "step": 440
797
+ },
798
+ {
799
+ "epoch": 1.44,
800
+ "grad_norm": 0.36349550750442733,
801
+ "learning_rate": 2.885985748218527e-07,
802
+ "logits/generated": -0.8298400044441223,
803
+ "logits/real": -1.2980700731277466,
804
+ "logps/generated": -342.68341064453125,
805
+ "logps/real": -89.83566284179688,
806
+ "loss": 0.1046,
807
+ "rewards/accuracies": 1.0,
808
+ "rewards/generated": -6.842597961425781,
809
+ "rewards/margins": 15.478503227233887,
810
+ "rewards/real": 8.635905265808105,
811
+ "step": 450
812
+ },
813
+ {
814
+ "epoch": 1.472,
815
+ "grad_norm": 0.37277388095763225,
816
+ "learning_rate": 2.8266033254156767e-07,
817
+ "logits/generated": -0.891290009021759,
818
+ "logits/real": -1.394723653793335,
819
+ "logps/generated": -341.93218994140625,
820
+ "logps/real": -103.62208557128906,
821
+ "loss": 0.1079,
822
+ "rewards/accuracies": 1.0,
823
+ "rewards/generated": -6.340664863586426,
824
+ "rewards/margins": 15.834001541137695,
825
+ "rewards/real": 9.493334770202637,
826
+ "step": 460
827
+ },
828
+ {
829
+ "epoch": 1.504,
830
+ "grad_norm": 0.3303199018618516,
831
+ "learning_rate": 2.7672209026128263e-07,
832
+ "logits/generated": -0.8582679629325867,
833
+ "logits/real": -1.4615408182144165,
834
+ "logps/generated": -349.00909423828125,
835
+ "logps/real": -104.46484375,
836
+ "loss": 0.0966,
837
+ "rewards/accuracies": 1.0,
838
+ "rewards/generated": -6.171267986297607,
839
+ "rewards/margins": 16.01020622253418,
840
+ "rewards/real": 9.838939666748047,
841
+ "step": 470
842
+ },
843
+ {
844
+ "epoch": 1.536,
845
+ "grad_norm": 0.3813272818464241,
846
+ "learning_rate": 2.7078384798099764e-07,
847
+ "logits/generated": -0.8334212303161621,
848
+ "logits/real": -1.4117028713226318,
849
+ "logps/generated": -349.4712829589844,
850
+ "logps/real": -107.6310806274414,
851
+ "loss": 0.1069,
852
+ "rewards/accuracies": 1.0,
853
+ "rewards/generated": -6.388515472412109,
854
+ "rewards/margins": 16.422515869140625,
855
+ "rewards/real": 10.034002304077148,
856
+ "step": 480
857
+ },
858
+ {
859
+ "epoch": 1.568,
860
+ "grad_norm": 0.3427218965024406,
861
+ "learning_rate": 2.648456057007126e-07,
862
+ "logits/generated": -0.8402020335197449,
863
+ "logits/real": -1.3591063022613525,
864
+ "logps/generated": -349.86529541015625,
865
+ "logps/real": -102.61138916015625,
866
+ "loss": 0.1038,
867
+ "rewards/accuracies": 1.0,
868
+ "rewards/generated": -6.4038848876953125,
869
+ "rewards/margins": 16.043880462646484,
870
+ "rewards/real": 9.639993667602539,
871
+ "step": 490
872
+ },
873
+ {
874
+ "epoch": 1.5872000000000002,
875
+ "eval_logits/generated": -0.8754745125770569,
876
+ "eval_logits/real": -1.3614826202392578,
877
+ "eval_logps/generated": -352.7068786621094,
878
+ "eval_logps/real": -106.12812042236328,
879
+ "eval_loss": 0.10832550376653671,
880
+ "eval_rewards/accuracies": 1.0,
881
+ "eval_rewards/generated": -7.003779888153076,
882
+ "eval_rewards/margins": 17.076799392700195,
883
+ "eval_rewards/real": 10.07302188873291,
884
+ "eval_runtime": 33.3124,
885
+ "eval_samples_per_second": 6.004,
886
+ "eval_steps_per_second": 0.39,
887
+ "step": 496
888
+ },
889
+ {
890
+ "epoch": 1.6,
891
+ "grad_norm": 0.38914741214890197,
892
+ "learning_rate": 2.589073634204275e-07,
893
+ "logits/generated": -0.8448807597160339,
894
+ "logits/real": -1.3226372003555298,
895
+ "logps/generated": -351.1488037109375,
896
+ "logps/real": -107.77713775634766,
897
+ "loss": 0.1085,
898
+ "rewards/accuracies": 1.0,
899
+ "rewards/generated": -6.437747955322266,
900
+ "rewards/margins": 16.31161117553711,
901
+ "rewards/real": 9.87386417388916,
902
+ "step": 500
903
+ },
904
+ {
905
+ "epoch": 1.6320000000000001,
906
+ "grad_norm": 0.3937890384115947,
907
+ "learning_rate": 2.529691211401425e-07,
908
+ "logits/generated": -0.8879863619804382,
909
+ "logits/real": -1.3836486339569092,
910
+ "logps/generated": -340.003662109375,
911
+ "logps/real": -106.28749084472656,
912
+ "loss": 0.1051,
913
+ "rewards/accuracies": 1.0,
914
+ "rewards/generated": -6.393700122833252,
915
+ "rewards/margins": 16.35400390625,
916
+ "rewards/real": 9.960305213928223,
917
+ "step": 510
918
+ },
919
+ {
920
+ "epoch": 1.6640000000000001,
921
+ "grad_norm": 0.38541180062987296,
922
+ "learning_rate": 2.4703087885985747e-07,
923
+ "logits/generated": -0.8842099905014038,
924
+ "logits/real": -1.3454530239105225,
925
+ "logps/generated": -357.91693115234375,
926
+ "logps/real": -115.9624252319336,
927
+ "loss": 0.1108,
928
+ "rewards/accuracies": 1.0,
929
+ "rewards/generated": -7.042295932769775,
930
+ "rewards/margins": 17.503582000732422,
931
+ "rewards/real": 10.461287498474121,
932
+ "step": 520
933
+ },
934
+ {
935
+ "epoch": 1.696,
936
+ "grad_norm": 0.3409231189845364,
937
+ "learning_rate": 2.410926365795724e-07,
938
+ "logits/generated": -0.8585386276245117,
939
+ "logits/real": -1.3780685663223267,
940
+ "logps/generated": -352.55780029296875,
941
+ "logps/real": -104.75419616699219,
942
+ "loss": 0.1091,
943
+ "rewards/accuracies": 1.0,
944
+ "rewards/generated": -6.910445213317871,
945
+ "rewards/margins": 16.95829963684082,
946
+ "rewards/real": 10.047855377197266,
947
+ "step": 530
948
+ },
949
+ {
950
+ "epoch": 1.728,
951
+ "grad_norm": 0.36170229656289943,
952
+ "learning_rate": 2.351543942992874e-07,
953
+ "logits/generated": -0.8263759613037109,
954
+ "logits/real": -1.477992057800293,
955
+ "logps/generated": -342.4795227050781,
956
+ "logps/real": -107.40743255615234,
957
+ "loss": 0.1066,
958
+ "rewards/accuracies": 1.0,
959
+ "rewards/generated": -6.372612953186035,
960
+ "rewards/margins": 16.573341369628906,
961
+ "rewards/real": 10.200728416442871,
962
+ "step": 540
963
+ },
964
+ {
965
+ "epoch": 1.76,
966
+ "grad_norm": 0.3413340610553401,
967
+ "learning_rate": 2.2921615201900234e-07,
968
+ "logits/generated": -0.8356834650039673,
969
+ "logits/real": -1.391550898551941,
970
+ "logps/generated": -350.9759521484375,
971
+ "logps/real": -100.52735137939453,
972
+ "loss": 0.0996,
973
+ "rewards/accuracies": 1.0,
974
+ "rewards/generated": -6.971991539001465,
975
+ "rewards/margins": 16.87733268737793,
976
+ "rewards/real": 9.905343055725098,
977
+ "step": 550
978
+ },
979
+ {
980
+ "epoch": 1.7856,
981
+ "eval_logits/generated": -0.8467180728912354,
982
+ "eval_logits/real": -1.3430825471878052,
983
+ "eval_logps/generated": -352.8455810546875,
984
+ "eval_logps/real": -105.63909149169922,
985
+ "eval_loss": 0.10793981701135635,
986
+ "eval_rewards/accuracies": 1.0,
987
+ "eval_rewards/generated": -7.0176496505737305,
988
+ "eval_rewards/margins": 17.139570236206055,
989
+ "eval_rewards/real": 10.121922492980957,
990
+ "eval_runtime": 26.3578,
991
+ "eval_samples_per_second": 7.588,
992
+ "eval_steps_per_second": 0.493,
993
+ "step": 558
994
  }
995
  ],
996
  "logging_steps": 10,