AmberYifan commited on
Commit
201977e
·
verified ·
1 Parent(s): 1da7693

Training in progress, step 310, checkpoint

Browse files
last-checkpoint/global_step310/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60f8137d4761f8c2bd9ab99f5be668bd702519ce7ac64c78eda8e3fc2620c25a
3
+ size 13476835648
last-checkpoint/global_step310/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85aaeb10b7115ba1c856de21eec3583959c79d28815cf8c670dca3b3f00c9bac
3
+ size 13476835648
last-checkpoint/global_step310/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d956dae0da7c7df185dd20bd6f860ce87327578ca48626be6aa1254f9468aab
3
+ size 13476835648
last-checkpoint/global_step310/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:448f39763b00dd35a0267adee83056d8b9b2e421836a35a5d3580a9a570c9075
3
+ size 13476835648
last-checkpoint/global_step310/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dfaccb97630865bfa96a9f8fc8e1eaac2f641bb5486f7f1b34ba82548d9a217
3
+ size 150693
last-checkpoint/global_step310/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c296a38893fbec54c8fb4c320b4ea180b982277ef291f058b5ffca0caf27bd2
3
+ size 150693
last-checkpoint/global_step310/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a19de9850756f925991116920eef332af9868426f05cf741786bffa261e1b51
3
+ size 150693
last-checkpoint/global_step310/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b775b848751a6b5c74313b60cd24e3e2d525b738411897a1a952fc106bb1799
3
+ size 150693
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step186
 
1
+ global_step310
last-checkpoint/model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:313d5167651e3868509dd3619ee1c2d07051385b98649993872036ea95d4aba0
3
  size 4938985352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7629983c481eb9200b556ac83ed8d209475fc4ef48f27d568a5cb34179c3b672
3
  size 4938985352
last-checkpoint/model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:845c39a62c9cb44d23ae87ad70b7d3a9dc92f88b09fb653b4375a2ca9ac136c3
3
  size 4947390880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7708922bcf1e99c851124c87b0ec55e1c4b40e5c0cea43b42302293a17729487
3
  size 4947390880
last-checkpoint/model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:61a944543e23aed815241148692fce42317e0a4e455f648feb2320a8353247ad
3
  size 3590488816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44492addf0ff01b4318cdfbe27b38d73decff5f3a716bd9a106eee463d36f582
3
  size 3590488816
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:50ca27603f7c4a4d9a980223e1a102922ac31561acfa7da4f28042e4e8b3528b
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85a44fde7a8ca235658f035c0812d344f55779640520411739b17e214177e846
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c57f658c3d9b6de611da50021823095fc4067036fb9a4b34655cc2e34fbf5c2b
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2caad91201b0df46e56af9eecef567ed2037350c38fdc81837724a4727d0b050
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:109da2c363a1e09432fa2ea2b7dceb6f67d1f91975069fc669e71dd536d654d8
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73e988587366c84fd1b4fc5931610543c6da84cf501cd98c78745fd102dd5024
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bda65e490958bfe3fe01157ed131eb2354f8fc19536842d27c998ecf29d48991
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55af3bb04c01d99df727583b8b7a09241b4e47d58ff1b9cf5532d3fa0d878b52
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4f13df3470221c87dbd73f49aa8200fcb840f387f1d9666c0df7b34d2fa99d1
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:deebfd046c912c12a5ec3992f182a7898d0a095fd57e8891bf19ccf9e61ba445
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.5952,
5
  "eval_steps": 62,
6
- "global_step": 186,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -340,6 +340,233 @@
340
  "eval_samples_per_second": 7.758,
341
  "eval_steps_per_second": 0.504,
342
  "step": 186
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
343
  }
344
  ],
345
  "logging_steps": 10,
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.992,
5
  "eval_steps": 62,
6
+ "global_step": 310,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
340
  "eval_samples_per_second": 7.758,
341
  "eval_steps_per_second": 0.504,
342
  "step": 186
343
+ },
344
+ {
345
+ "epoch": 0.608,
346
+ "grad_norm": 0.39320789077558344,
347
+ "learning_rate": 4.429928741092636e-07,
348
+ "logits/generated": -0.8406023979187012,
349
+ "logits/real": -1.2843071222305298,
350
+ "logps/generated": -316.73291015625,
351
+ "logps/real": -109.3148193359375,
352
+ "loss": 0.1103,
353
+ "rewards/accuracies": 1.0,
354
+ "rewards/generated": -4.513542175292969,
355
+ "rewards/margins": 14.111068725585938,
356
+ "rewards/real": 9.597526550292969,
357
+ "step": 190
358
+ },
359
+ {
360
+ "epoch": 0.64,
361
+ "grad_norm": 0.34126559985788285,
362
+ "learning_rate": 4.3705463182897863e-07,
363
+ "logits/generated": -0.8079656362533569,
364
+ "logits/real": -1.2299845218658447,
365
+ "logps/generated": -333.931396484375,
366
+ "logps/real": -113.5406723022461,
367
+ "loss": 0.1079,
368
+ "rewards/accuracies": 1.0,
369
+ "rewards/generated": -5.271535873413086,
370
+ "rewards/margins": 14.859156608581543,
371
+ "rewards/real": 9.587618827819824,
372
+ "step": 200
373
+ },
374
+ {
375
+ "epoch": 0.672,
376
+ "grad_norm": 0.37211551392957165,
377
+ "learning_rate": 4.311163895486936e-07,
378
+ "logits/generated": -0.8258484601974487,
379
+ "logits/real": -1.2792431116104126,
380
+ "logps/generated": -326.34539794921875,
381
+ "logps/real": -110.4327621459961,
382
+ "loss": 0.1062,
383
+ "rewards/accuracies": 1.0,
384
+ "rewards/generated": -4.544249534606934,
385
+ "rewards/margins": 13.822877883911133,
386
+ "rewards/real": 9.278627395629883,
387
+ "step": 210
388
+ },
389
+ {
390
+ "epoch": 0.704,
391
+ "grad_norm": 0.40528624225351695,
392
+ "learning_rate": 4.251781472684085e-07,
393
+ "logits/generated": -0.9005807638168335,
394
+ "logits/real": -1.367760419845581,
395
+ "logps/generated": -334.90667724609375,
396
+ "logps/real": -108.89170837402344,
397
+ "loss": 0.1082,
398
+ "rewards/accuracies": 1.0,
399
+ "rewards/generated": -5.304292678833008,
400
+ "rewards/margins": 14.677830696105957,
401
+ "rewards/real": 9.37353801727295,
402
+ "step": 220
403
+ },
404
+ {
405
+ "epoch": 0.736,
406
+ "grad_norm": 0.4299824458037775,
407
+ "learning_rate": 4.192399049881235e-07,
408
+ "logits/generated": -0.871414065361023,
409
+ "logits/real": -1.2680821418762207,
410
+ "logps/generated": -327.0166015625,
411
+ "logps/real": -125.11517333984375,
412
+ "loss": 0.1201,
413
+ "rewards/accuracies": 1.0,
414
+ "rewards/generated": -5.102071285247803,
415
+ "rewards/margins": 15.333366394042969,
416
+ "rewards/real": 10.231294631958008,
417
+ "step": 230
418
+ },
419
+ {
420
+ "epoch": 0.768,
421
+ "grad_norm": 0.3200345894830024,
422
+ "learning_rate": 4.1330166270783846e-07,
423
+ "logits/generated": -0.8396976590156555,
424
+ "logits/real": -1.2651922702789307,
425
+ "logps/generated": -349.18804931640625,
426
+ "logps/real": -117.8864517211914,
427
+ "loss": 0.1094,
428
+ "rewards/accuracies": 1.0,
429
+ "rewards/generated": -5.743192672729492,
430
+ "rewards/margins": 15.722867965698242,
431
+ "rewards/real": 9.979674339294434,
432
+ "step": 240
433
+ },
434
+ {
435
+ "epoch": 0.7936,
436
+ "eval_logits/generated": -0.8538265228271484,
437
+ "eval_logits/real": -1.2560151815414429,
438
+ "eval_logps/generated": -337.5219421386719,
439
+ "eval_logps/real": -108.52310180664062,
440
+ "eval_loss": 0.11097312718629837,
441
+ "eval_rewards/accuracies": 1.0,
442
+ "eval_rewards/generated": -5.485285758972168,
443
+ "eval_rewards/margins": 15.318806648254395,
444
+ "eval_rewards/real": 9.83352279663086,
445
+ "eval_runtime": 32.0233,
446
+ "eval_samples_per_second": 6.245,
447
+ "eval_steps_per_second": 0.406,
448
+ "step": 248
449
+ },
450
+ {
451
+ "epoch": 0.8,
452
+ "grad_norm": 0.37657892572843127,
453
+ "learning_rate": 4.0736342042755347e-07,
454
+ "logits/generated": -0.8381448984146118,
455
+ "logits/real": -1.293889045715332,
456
+ "logps/generated": -344.9915466308594,
457
+ "logps/real": -111.15998840332031,
458
+ "loss": 0.1113,
459
+ "rewards/accuracies": 1.0,
460
+ "rewards/generated": -5.526784896850586,
461
+ "rewards/margins": 15.003395080566406,
462
+ "rewards/real": 9.476609230041504,
463
+ "step": 250
464
+ },
465
+ {
466
+ "epoch": 0.832,
467
+ "grad_norm": 0.3794924953311087,
468
+ "learning_rate": 4.0142517814726837e-07,
469
+ "logits/generated": -0.8616489171981812,
470
+ "logits/real": -1.342829704284668,
471
+ "logps/generated": -333.8689270019531,
472
+ "logps/real": -110.18806457519531,
473
+ "loss": 0.1068,
474
+ "rewards/accuracies": 1.0,
475
+ "rewards/generated": -5.346303939819336,
476
+ "rewards/margins": 15.174580574035645,
477
+ "rewards/real": 9.828276634216309,
478
+ "step": 260
479
+ },
480
+ {
481
+ "epoch": 0.864,
482
+ "grad_norm": 0.38432288454636715,
483
+ "learning_rate": 3.9548693586698333e-07,
484
+ "logits/generated": -0.8341599702835083,
485
+ "logits/real": -1.2853684425354004,
486
+ "logps/generated": -340.5439147949219,
487
+ "logps/real": -111.25767517089844,
488
+ "loss": 0.1119,
489
+ "rewards/accuracies": 1.0,
490
+ "rewards/generated": -5.1574320793151855,
491
+ "rewards/margins": 14.693034172058105,
492
+ "rewards/real": 9.535603523254395,
493
+ "step": 270
494
+ },
495
+ {
496
+ "epoch": 0.896,
497
+ "grad_norm": 0.4988860977100256,
498
+ "learning_rate": 3.8954869358669834e-07,
499
+ "logits/generated": -0.842201828956604,
500
+ "logits/real": -1.3558833599090576,
501
+ "logps/generated": -338.8299560546875,
502
+ "logps/real": -110.4022216796875,
503
+ "loss": 0.1111,
504
+ "rewards/accuracies": 1.0,
505
+ "rewards/generated": -5.072219371795654,
506
+ "rewards/margins": 14.635177612304688,
507
+ "rewards/real": 9.562958717346191,
508
+ "step": 280
509
+ },
510
+ {
511
+ "epoch": 0.928,
512
+ "grad_norm": 0.38841887432580663,
513
+ "learning_rate": 3.836104513064133e-07,
514
+ "logits/generated": -0.8865805864334106,
515
+ "logits/real": -1.2532027959823608,
516
+ "logps/generated": -338.3769226074219,
517
+ "logps/real": -120.43833923339844,
518
+ "loss": 0.1084,
519
+ "rewards/accuracies": 1.0,
520
+ "rewards/generated": -5.086993217468262,
521
+ "rewards/margins": 15.214749336242676,
522
+ "rewards/real": 10.127756118774414,
523
+ "step": 290
524
+ },
525
+ {
526
+ "epoch": 0.96,
527
+ "grad_norm": 0.3616732188669415,
528
+ "learning_rate": 3.7767220902612825e-07,
529
+ "logits/generated": -0.8655015826225281,
530
+ "logits/real": -1.3518953323364258,
531
+ "logps/generated": -325.9730529785156,
532
+ "logps/real": -95.09385681152344,
533
+ "loss": 0.1028,
534
+ "rewards/accuracies": 1.0,
535
+ "rewards/generated": -5.991705417633057,
536
+ "rewards/margins": 14.74760627746582,
537
+ "rewards/real": 8.755899429321289,
538
+ "step": 300
539
+ },
540
+ {
541
+ "epoch": 0.992,
542
+ "grad_norm": 0.39359159204366234,
543
+ "learning_rate": 3.717339667458432e-07,
544
+ "logits/generated": -0.8543545603752136,
545
+ "logits/real": -1.3398587703704834,
546
+ "logps/generated": -338.96466064453125,
547
+ "logps/real": -116.5450668334961,
548
+ "loss": 0.1115,
549
+ "rewards/accuracies": 1.0,
550
+ "rewards/generated": -5.719244480133057,
551
+ "rewards/margins": 15.74243450164795,
552
+ "rewards/real": 10.02319049835205,
553
+ "step": 310
554
+ },
555
+ {
556
+ "epoch": 0.992,
557
+ "eval_logits/generated": -0.865822434425354,
558
+ "eval_logits/real": -1.33043372631073,
559
+ "eval_logps/generated": -347.4965515136719,
560
+ "eval_logps/real": -107.73165130615234,
561
+ "eval_loss": 0.11000669747591019,
562
+ "eval_rewards/accuracies": 1.0,
563
+ "eval_rewards/generated": -6.482741832733154,
564
+ "eval_rewards/margins": 16.39541244506836,
565
+ "eval_rewards/real": 9.912667274475098,
566
+ "eval_runtime": 24.7895,
567
+ "eval_samples_per_second": 8.068,
568
+ "eval_steps_per_second": 0.524,
569
+ "step": 310
570
  }
571
  ],
572
  "logging_steps": 10,