Sai1212 committed on
Commit
017a401
·
1 Parent(s): 3f4eb3b

Training in progress, epoch 0

Browse files
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
- "epoch": 2.0,
3
- "eval_accuracy": 0.5316455696202531,
4
- "eval_loss": 0.6931473612785339,
5
- "eval_runtime": 4.6123,
6
- "eval_samples_per_second": 17.128,
7
- "eval_steps_per_second": 0.65,
8
- "total_flos": 2.898785558237184e+16,
9
- "train_loss": 0.6919973691304525,
10
- "train_runtime": 76.6563,
11
- "train_samples_per_second": 7.24,
12
- "train_steps_per_second": 0.039
13
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "eval_accuracy": 0.6075949367088608,
4
+ "eval_loss": 0.6998201608657837,
5
+ "eval_runtime": 4.8772,
6
+ "eval_samples_per_second": 16.198,
7
+ "eval_steps_per_second": 0.615,
8
+ "total_flos": 7.24696389559296e+16,
9
+ "train_loss": 0.6189225832621257,
10
+ "train_runtime": 239.3324,
11
+ "train_samples_per_second": 3.865,
12
+ "train_steps_per_second": 0.063
13
  }
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "microsoft/swin-base-patch4-window7-224-in22k",
3
  "architectures": [
4
  "SwinForImageClassification"
5
  ],
 
1
  {
2
+ "_name_or_path": "microsoft/swin-base-patch4-window7-224",
3
  "architectures": [
4
  "SwinForImageClassification"
5
  ],
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.0,
3
- "eval_accuracy": 0.5316455696202531,
4
- "eval_loss": 0.6931473612785339,
5
- "eval_runtime": 4.6123,
6
- "eval_samples_per_second": 17.128,
7
- "eval_steps_per_second": 0.65
8
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "eval_accuracy": 0.6075949367088608,
4
+ "eval_loss": 0.6998201608657837,
5
+ "eval_runtime": 4.8772,
6
+ "eval_samples_per_second": 16.198,
7
+ "eval_steps_per_second": 0.615
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:363abce521002a977839e8351f62ccd2f073f9b8cf1d343ccff6f7c2289df88d
3
  size 347498816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df8adc4c51d350d67a55f0839f29ccdc4aa6512435637b5049feecea36a34232
3
  size 347498816
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 2.0,
3
- "total_flos": 2.898785558237184e+16,
4
- "train_loss": 0.6919973691304525,
5
- "train_runtime": 76.6563,
6
- "train_samples_per_second": 7.24,
7
- "train_steps_per_second": 0.039
8
  }
 
1
  {
2
+ "epoch": 5.0,
3
+ "total_flos": 7.24696389559296e+16,
4
+ "train_loss": 0.6189225832621257,
5
+ "train_runtime": 239.3324,
6
+ "train_samples_per_second": 3.865,
7
+ "train_steps_per_second": 0.063
8
  }
trainer_state.json CHANGED
@@ -1,47 +1,80 @@
1
  {
2
- "best_metric": 0.5316455696202531,
3
- "best_model_checkpoint": "swin-finetuned-food101\\checkpoint-1",
4
- "epoch": 2.0,
5
  "eval_steps": 500,
6
- "global_step": 3,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.67,
13
- "eval_accuracy": 0.5316455696202531,
14
- "eval_loss": 0.6931473612785339,
15
- "eval_runtime": 5.5884,
16
- "eval_samples_per_second": 14.136,
17
- "eval_steps_per_second": 0.537,
18
- "step": 1
19
- },
20
- {
21
- "epoch": 2.0,
22
  "eval_accuracy": 0.46835443037974683,
23
- "eval_loss": 0.6949594020843506,
24
- "eval_runtime": 3.9224,
25
- "eval_samples_per_second": 20.141,
26
- "eval_steps_per_second": 0.765,
27
  "step": 3
28
  },
29
  {
30
  "epoch": 2.0,
31
- "step": 3,
32
- "total_flos": 2.898785558237184e+16,
33
- "train_loss": 0.6919973691304525,
34
- "train_runtime": 76.6563,
35
- "train_samples_per_second": 7.24,
36
- "train_steps_per_second": 0.039
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
37
  }
38
  ],
39
  "logging_steps": 10,
40
- "max_steps": 3,
41
  "num_input_tokens_seen": 0,
42
- "num_train_epochs": 3,
43
  "save_steps": 500,
44
- "total_flos": 2.898785558237184e+16,
45
  "train_batch_size": 32,
46
  "trial_name": null,
47
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.6075949367088608,
3
+ "best_model_checkpoint": "swin-finetuned-food101\\checkpoint-12",
4
+ "epoch": 5.0,
5
  "eval_steps": 500,
6
+ "global_step": 15,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 1.0,
 
 
 
 
 
 
 
 
 
13
  "eval_accuracy": 0.46835443037974683,
14
+ "eval_loss": 0.709945797920227,
15
+ "eval_runtime": 4.7061,
16
+ "eval_samples_per_second": 16.787,
17
+ "eval_steps_per_second": 0.637,
18
  "step": 3
19
  },
20
  {
21
  "epoch": 2.0,
22
+ "eval_accuracy": 0.569620253164557,
23
+ "eval_loss": 0.7113380432128906,
24
+ "eval_runtime": 5.1386,
25
+ "eval_samples_per_second": 15.374,
26
+ "eval_steps_per_second": 0.584,
27
+ "step": 6
28
+ },
29
+ {
30
+ "epoch": 3.0,
31
+ "eval_accuracy": 0.4810126582278481,
32
+ "eval_loss": 0.8271049857139587,
33
+ "eval_runtime": 4.3712,
34
+ "eval_samples_per_second": 18.073,
35
+ "eval_steps_per_second": 0.686,
36
+ "step": 9
37
+ },
38
+ {
39
+ "epoch": 3.33,
40
+ "learning_rate": 7.142857142857143e-05,
41
+ "loss": 0.6561,
42
+ "step": 10
43
+ },
44
+ {
45
+ "epoch": 4.0,
46
+ "eval_accuracy": 0.6075949367088608,
47
+ "eval_loss": 0.6998201608657837,
48
+ "eval_runtime": 4.5439,
49
+ "eval_samples_per_second": 17.386,
50
+ "eval_steps_per_second": 0.66,
51
+ "step": 12
52
+ },
53
+ {
54
+ "epoch": 5.0,
55
+ "eval_accuracy": 0.5822784810126582,
56
+ "eval_loss": 0.8232901096343994,
57
+ "eval_runtime": 6.1137,
58
+ "eval_samples_per_second": 12.922,
59
+ "eval_steps_per_second": 0.491,
60
+ "step": 15
61
+ },
62
+ {
63
+ "epoch": 5.0,
64
+ "step": 15,
65
+ "total_flos": 7.24696389559296e+16,
66
+ "train_loss": 0.6189225832621257,
67
+ "train_runtime": 239.3324,
68
+ "train_samples_per_second": 3.865,
69
+ "train_steps_per_second": 0.063
70
  }
71
  ],
72
  "logging_steps": 10,
73
+ "max_steps": 15,
74
  "num_input_tokens_seen": 0,
75
+ "num_train_epochs": 5,
76
  "save_steps": 500,
77
+ "total_flos": 7.24696389559296e+16,
78
  "train_batch_size": 32,
79
  "trial_name": null,
80
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33a0d34bffcd583aa49a3ad059ebf6d6eeeb3d75e3117868411d5c74be66b67f
3
  size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35bc3aedffcd97a81146ac1708f5ec50be895ef7811e6fdf6a464670897316c1
3
  size 4728