Training in progress, step 558, checkpoint
Browse files- last-checkpoint/global_step558/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step558/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step558/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step558/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step558/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step558/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step558/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step558/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/model-00001-of-00003.safetensors +1 -1
- last-checkpoint/model-00002-of-00003.safetensors +1 -1
- last-checkpoint/model-00003-of-00003.safetensors +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +214 -2
last-checkpoint/global_step558/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b677f36c4dbba1597865689e743500347cf501cc6219466ae215b6987e26c4a
|
3 |
+
size 13476835648
|
last-checkpoint/global_step558/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fd0ebda0c87e79dc3722e97a2df83ca342944de2a92d4bc676479aecc3b820d
|
3 |
+
size 13476835648
|
last-checkpoint/global_step558/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f9907c8908adefd6616ebf28806c3565f695ec1ecb08061a9d4d09788bf909d
|
3 |
+
size 13476835648
|
last-checkpoint/global_step558/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5f08ee6a4a2fed19229106f2679c8a3cb7920a4ac82776a9eb8c61e74ef154a
|
3 |
+
size 13476835648
|
last-checkpoint/global_step558/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4197fab2e1b6c27eb80b4a12b9a89a88edef0d3b3bc4098bec66af56ce12175
|
3 |
+
size 150693
|
last-checkpoint/global_step558/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78b498011d22d6099b99f0e237cd72ed3cc9140d37841de3cb31cf16841ffd25
|
3 |
+
size 150693
|
last-checkpoint/global_step558/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f4e0cdbc12c565dcf5572f41f7bcd3101a01a4f373e5c67c204ba7126453f93
|
3 |
+
size 150693
|
last-checkpoint/global_step558/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:305d0a1a20b6d3b7dde4970a8b61cc22630f0e88cc5cba0ed422e6061840955a
|
3 |
+
size 150693
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step558
|
last-checkpoint/model-00001-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4938985352
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f57988b40ea7809dc08638e5caf7cc644808696ba431653d54751fa8e2ee7bef
|
3 |
size 4938985352
|
last-checkpoint/model-00002-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4947390880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9637b70c600dc8d9de7c223cc42a2f547cec4117ec96d7971ad9596f125f6d4b
|
3 |
size 4947390880
|
last-checkpoint/model-00003-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3590488816
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57ab4e25910ea5f9e07b0b0aa8590e1bbbeec9b69fd598de221f66b43383d7c9
|
3 |
size 3590488816
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb3d4793d6c7fda650513b6f3d24fe7afd643475a576b0104a85cb659ed441d3
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e44567105884943a8351ea71e9a71011cceee34a8f2a067be69948ea21390f49
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c3a6f11c1c82a313f717b58d29d20267d0bfc621c79116ac6f752e0c1ba1f50
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aaa97839e10563397740560600a86ccaf5a6fe1e5f41084453cab0f732a05570
|
3 |
size 15024
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:177a5448d699047d35d72636914adc373df5f511600959de3a1ed1ce15a52556
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 1.
|
5 |
"eval_steps": 62,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -779,6 +779,218 @@
|
|
779 |
"eval_samples_per_second": 7.784,
|
780 |
"eval_steps_per_second": 0.506,
|
781 |
"step": 434
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
782 |
}
|
783 |
],
|
784 |
"logging_steps": 10,
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 1.7856,
|
5 |
"eval_steps": 62,
|
6 |
+
"global_step": 558,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
779 |
"eval_samples_per_second": 7.784,
|
780 |
"eval_steps_per_second": 0.506,
|
781 |
"step": 434
|
782 |
+
},
|
783 |
+
{
|
784 |
+
"epoch": 1.408,
|
785 |
+
"grad_norm": 0.35037689567096764,
|
786 |
+
"learning_rate": 2.9453681710213776e-07,
|
787 |
+
"logits/generated": -0.8212960362434387,
|
788 |
+
"logits/real": -1.3137534856796265,
|
789 |
+
"logps/generated": -355.6631774902344,
|
790 |
+
"logps/real": -114.98287200927734,
|
791 |
+
"loss": 0.1095,
|
792 |
+
"rewards/accuracies": 1.0,
|
793 |
+
"rewards/generated": -6.6356201171875,
|
794 |
+
"rewards/margins": 16.64114761352539,
|
795 |
+
"rewards/real": 10.00552749633789,
|
796 |
+
"step": 440
|
797 |
+
},
|
798 |
+
{
|
799 |
+
"epoch": 1.44,
|
800 |
+
"grad_norm": 0.36349550750442733,
|
801 |
+
"learning_rate": 2.885985748218527e-07,
|
802 |
+
"logits/generated": -0.8298400044441223,
|
803 |
+
"logits/real": -1.2980700731277466,
|
804 |
+
"logps/generated": -342.68341064453125,
|
805 |
+
"logps/real": -89.83566284179688,
|
806 |
+
"loss": 0.1046,
|
807 |
+
"rewards/accuracies": 1.0,
|
808 |
+
"rewards/generated": -6.842597961425781,
|
809 |
+
"rewards/margins": 15.478503227233887,
|
810 |
+
"rewards/real": 8.635905265808105,
|
811 |
+
"step": 450
|
812 |
+
},
|
813 |
+
{
|
814 |
+
"epoch": 1.472,
|
815 |
+
"grad_norm": 0.37277388095763225,
|
816 |
+
"learning_rate": 2.8266033254156767e-07,
|
817 |
+
"logits/generated": -0.891290009021759,
|
818 |
+
"logits/real": -1.394723653793335,
|
819 |
+
"logps/generated": -341.93218994140625,
|
820 |
+
"logps/real": -103.62208557128906,
|
821 |
+
"loss": 0.1079,
|
822 |
+
"rewards/accuracies": 1.0,
|
823 |
+
"rewards/generated": -6.340664863586426,
|
824 |
+
"rewards/margins": 15.834001541137695,
|
825 |
+
"rewards/real": 9.493334770202637,
|
826 |
+
"step": 460
|
827 |
+
},
|
828 |
+
{
|
829 |
+
"epoch": 1.504,
|
830 |
+
"grad_norm": 0.3303199018618516,
|
831 |
+
"learning_rate": 2.7672209026128263e-07,
|
832 |
+
"logits/generated": -0.8582679629325867,
|
833 |
+
"logits/real": -1.4615408182144165,
|
834 |
+
"logps/generated": -349.00909423828125,
|
835 |
+
"logps/real": -104.46484375,
|
836 |
+
"loss": 0.0966,
|
837 |
+
"rewards/accuracies": 1.0,
|
838 |
+
"rewards/generated": -6.171267986297607,
|
839 |
+
"rewards/margins": 16.01020622253418,
|
840 |
+
"rewards/real": 9.838939666748047,
|
841 |
+
"step": 470
|
842 |
+
},
|
843 |
+
{
|
844 |
+
"epoch": 1.536,
|
845 |
+
"grad_norm": 0.3813272818464241,
|
846 |
+
"learning_rate": 2.7078384798099764e-07,
|
847 |
+
"logits/generated": -0.8334212303161621,
|
848 |
+
"logits/real": -1.4117028713226318,
|
849 |
+
"logps/generated": -349.4712829589844,
|
850 |
+
"logps/real": -107.6310806274414,
|
851 |
+
"loss": 0.1069,
|
852 |
+
"rewards/accuracies": 1.0,
|
853 |
+
"rewards/generated": -6.388515472412109,
|
854 |
+
"rewards/margins": 16.422515869140625,
|
855 |
+
"rewards/real": 10.034002304077148,
|
856 |
+
"step": 480
|
857 |
+
},
|
858 |
+
{
|
859 |
+
"epoch": 1.568,
|
860 |
+
"grad_norm": 0.3427218965024406,
|
861 |
+
"learning_rate": 2.648456057007126e-07,
|
862 |
+
"logits/generated": -0.8402020335197449,
|
863 |
+
"logits/real": -1.3591063022613525,
|
864 |
+
"logps/generated": -349.86529541015625,
|
865 |
+
"logps/real": -102.61138916015625,
|
866 |
+
"loss": 0.1038,
|
867 |
+
"rewards/accuracies": 1.0,
|
868 |
+
"rewards/generated": -6.4038848876953125,
|
869 |
+
"rewards/margins": 16.043880462646484,
|
870 |
+
"rewards/real": 9.639993667602539,
|
871 |
+
"step": 490
|
872 |
+
},
|
873 |
+
{
|
874 |
+
"epoch": 1.5872000000000002,
|
875 |
+
"eval_logits/generated": -0.8754745125770569,
|
876 |
+
"eval_logits/real": -1.3614826202392578,
|
877 |
+
"eval_logps/generated": -352.7068786621094,
|
878 |
+
"eval_logps/real": -106.12812042236328,
|
879 |
+
"eval_loss": 0.10832550376653671,
|
880 |
+
"eval_rewards/accuracies": 1.0,
|
881 |
+
"eval_rewards/generated": -7.003779888153076,
|
882 |
+
"eval_rewards/margins": 17.076799392700195,
|
883 |
+
"eval_rewards/real": 10.07302188873291,
|
884 |
+
"eval_runtime": 33.3124,
|
885 |
+
"eval_samples_per_second": 6.004,
|
886 |
+
"eval_steps_per_second": 0.39,
|
887 |
+
"step": 496
|
888 |
+
},
|
889 |
+
{
|
890 |
+
"epoch": 1.6,
|
891 |
+
"grad_norm": 0.38914741214890197,
|
892 |
+
"learning_rate": 2.589073634204275e-07,
|
893 |
+
"logits/generated": -0.8448807597160339,
|
894 |
+
"logits/real": -1.3226372003555298,
|
895 |
+
"logps/generated": -351.1488037109375,
|
896 |
+
"logps/real": -107.77713775634766,
|
897 |
+
"loss": 0.1085,
|
898 |
+
"rewards/accuracies": 1.0,
|
899 |
+
"rewards/generated": -6.437747955322266,
|
900 |
+
"rewards/margins": 16.31161117553711,
|
901 |
+
"rewards/real": 9.87386417388916,
|
902 |
+
"step": 500
|
903 |
+
},
|
904 |
+
{
|
905 |
+
"epoch": 1.6320000000000001,
|
906 |
+
"grad_norm": 0.3937890384115947,
|
907 |
+
"learning_rate": 2.529691211401425e-07,
|
908 |
+
"logits/generated": -0.8879863619804382,
|
909 |
+
"logits/real": -1.3836486339569092,
|
910 |
+
"logps/generated": -340.003662109375,
|
911 |
+
"logps/real": -106.28749084472656,
|
912 |
+
"loss": 0.1051,
|
913 |
+
"rewards/accuracies": 1.0,
|
914 |
+
"rewards/generated": -6.393700122833252,
|
915 |
+
"rewards/margins": 16.35400390625,
|
916 |
+
"rewards/real": 9.960305213928223,
|
917 |
+
"step": 510
|
918 |
+
},
|
919 |
+
{
|
920 |
+
"epoch": 1.6640000000000001,
|
921 |
+
"grad_norm": 0.38541180062987296,
|
922 |
+
"learning_rate": 2.4703087885985747e-07,
|
923 |
+
"logits/generated": -0.8842099905014038,
|
924 |
+
"logits/real": -1.3454530239105225,
|
925 |
+
"logps/generated": -357.91693115234375,
|
926 |
+
"logps/real": -115.9624252319336,
|
927 |
+
"loss": 0.1108,
|
928 |
+
"rewards/accuracies": 1.0,
|
929 |
+
"rewards/generated": -7.042295932769775,
|
930 |
+
"rewards/margins": 17.503582000732422,
|
931 |
+
"rewards/real": 10.461287498474121,
|
932 |
+
"step": 520
|
933 |
+
},
|
934 |
+
{
|
935 |
+
"epoch": 1.696,
|
936 |
+
"grad_norm": 0.3409231189845364,
|
937 |
+
"learning_rate": 2.410926365795724e-07,
|
938 |
+
"logits/generated": -0.8585386276245117,
|
939 |
+
"logits/real": -1.3780685663223267,
|
940 |
+
"logps/generated": -352.55780029296875,
|
941 |
+
"logps/real": -104.75419616699219,
|
942 |
+
"loss": 0.1091,
|
943 |
+
"rewards/accuracies": 1.0,
|
944 |
+
"rewards/generated": -6.910445213317871,
|
945 |
+
"rewards/margins": 16.95829963684082,
|
946 |
+
"rewards/real": 10.047855377197266,
|
947 |
+
"step": 530
|
948 |
+
},
|
949 |
+
{
|
950 |
+
"epoch": 1.728,
|
951 |
+
"grad_norm": 0.36170229656289943,
|
952 |
+
"learning_rate": 2.351543942992874e-07,
|
953 |
+
"logits/generated": -0.8263759613037109,
|
954 |
+
"logits/real": -1.477992057800293,
|
955 |
+
"logps/generated": -342.4795227050781,
|
956 |
+
"logps/real": -107.40743255615234,
|
957 |
+
"loss": 0.1066,
|
958 |
+
"rewards/accuracies": 1.0,
|
959 |
+
"rewards/generated": -6.372612953186035,
|
960 |
+
"rewards/margins": 16.573341369628906,
|
961 |
+
"rewards/real": 10.200728416442871,
|
962 |
+
"step": 540
|
963 |
+
},
|
964 |
+
{
|
965 |
+
"epoch": 1.76,
|
966 |
+
"grad_norm": 0.3413340610553401,
|
967 |
+
"learning_rate": 2.2921615201900234e-07,
|
968 |
+
"logits/generated": -0.8356834650039673,
|
969 |
+
"logits/real": -1.391550898551941,
|
970 |
+
"logps/generated": -350.9759521484375,
|
971 |
+
"logps/real": -100.52735137939453,
|
972 |
+
"loss": 0.0996,
|
973 |
+
"rewards/accuracies": 1.0,
|
974 |
+
"rewards/generated": -6.971991539001465,
|
975 |
+
"rewards/margins": 16.87733268737793,
|
976 |
+
"rewards/real": 9.905343055725098,
|
977 |
+
"step": 550
|
978 |
+
},
|
979 |
+
{
|
980 |
+
"epoch": 1.7856,
|
981 |
+
"eval_logits/generated": -0.8467180728912354,
|
982 |
+
"eval_logits/real": -1.3430825471878052,
|
983 |
+
"eval_logps/generated": -352.8455810546875,
|
984 |
+
"eval_logps/real": -105.63909149169922,
|
985 |
+
"eval_loss": 0.10793981701135635,
|
986 |
+
"eval_rewards/accuracies": 1.0,
|
987 |
+
"eval_rewards/generated": -7.0176496505737305,
|
988 |
+
"eval_rewards/margins": 17.139570236206055,
|
989 |
+
"eval_rewards/real": 10.121922492980957,
|
990 |
+
"eval_runtime": 26.3578,
|
991 |
+
"eval_samples_per_second": 7.588,
|
992 |
+
"eval_steps_per_second": 0.493,
|
993 |
+
"step": 558
|
994 |
}
|
995 |
],
|
996 |
"logging_steps": 10,
|