tttx
/

PEFT
Safetensors
llama
alignment-handbook
trl
sft
Generated from Trainer
File size: 2,150 Bytes
f4a81c1
 
 
 
 
c08df0a
f4a81c1
 
 
 
 
c08df0a
1d11ba9
c08df0a
1d11ba9
f4a81c1
 
 
c08df0a
1d11ba9
c08df0a
1d11ba9
f4a81c1
 
 
c08df0a
1d11ba9
c08df0a
1d11ba9
f4a81c1
 
 
c08df0a
1d11ba9
c08df0a
1d11ba9
f4a81c1
 
 
c08df0a
1d11ba9
c08df0a
1d11ba9
f4a81c1
 
 
c08df0a
1d11ba9
c08df0a
1d11ba9
f4a81c1
 
 
 
1d11ba9
f4a81c1
1d11ba9
c08df0a
f4a81c1
 
 
1d11ba9
 
 
 
c08df0a
f4a81c1
 
 
c08df0a
 
1d11ba9
 
 
a439717
f4a81c1
 
 
c08df0a
f4a81c1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
c08df0a
 
f4a81c1
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 1.0,
  "eval_steps": 500,
  "global_step": 7,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.14285714285714285,
      "grad_norm": NaN,
      "learning_rate": 1e-05,
      "loss": 0.0,
      "step": 1
    },
    {
      "epoch": 0.2857142857142857,
      "grad_norm": NaN,
      "learning_rate": 9.330127018922195e-06,
      "loss": 0.0,
      "step": 2
    },
    {
      "epoch": 0.42857142857142855,
      "grad_norm": NaN,
      "learning_rate": 7.500000000000001e-06,
      "loss": 0.0,
      "step": 3
    },
    {
      "epoch": 0.5714285714285714,
      "grad_norm": NaN,
      "learning_rate": 5e-06,
      "loss": 0.0,
      "step": 4
    },
    {
      "epoch": 0.7142857142857143,
      "grad_norm": NaN,
      "learning_rate": 2.5000000000000015e-06,
      "loss": 0.0,
      "step": 5
    },
    {
      "epoch": 0.8571428571428571,
      "grad_norm": NaN,
      "learning_rate": 6.698729810778065e-07,
      "loss": 0.0,
      "step": 6
    },
    {
      "epoch": 1.0,
      "grad_norm": NaN,
      "learning_rate": 0.0,
      "loss": 0.0,
      "step": 7
    },
    {
      "epoch": 1.0,
      "eval_loss": NaN,
      "eval_runtime": 2.1348,
      "eval_samples_per_second": 0.468,
      "eval_steps_per_second": 0.468,
      "step": 7
    },
    {
      "epoch": 1.0,
      "step": 7,
      "total_flos": 54979878453248.0,
      "train_loss": 0.0,
      "train_runtime": 98.4374,
      "train_samples_per_second": 1.016,
      "train_steps_per_second": 0.071
    }
  ],
  "logging_steps": 1,
  "max_steps": 7,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 1,
  "save_steps": 500,
  "stateful_callbacks": {
    "TrainerControl": {
      "args": {
        "should_epoch_stop": false,
        "should_evaluate": false,
        "should_log": false,
        "should_save": false,
        "should_training_stop": false
      },
      "attributes": {}
    }
  },
  "total_flos": 54979878453248.0,
  "train_batch_size": 2,
  "trial_name": null,
  "trial_params": null
}