pierreguillou commited on
Commit
b7ec3ce
1 Parent(s): 7419b6c

End of training

Browse files
checkpoint-1700/config.json DELETED
@@ -1,56 +0,0 @@
1
- {
2
- "_name_or_path": "nielsr/lilt-xlm-roberta-base",
3
- "architectures": [
4
- "LiltForTokenClassification"
5
- ],
6
- "attention_probs_dropout_prob": 0.1,
7
- "bos_token_id": 0,
8
- "channel_shrink_ratio": 4,
9
- "classifier_dropout": null,
10
- "eos_token_id": 2,
11
- "hidden_act": "gelu",
12
- "hidden_dropout_prob": 0.1,
13
- "hidden_size": 768,
14
- "id2label": {
15
- "0": "Caption",
16
- "1": "Footnote",
17
- "2": "Formula",
18
- "3": "List-item",
19
- "4": "Page-footer",
20
- "5": "Page-header",
21
- "6": "Picture",
22
- "7": "Section-header",
23
- "8": "Table",
24
- "9": "Text",
25
- "10": "Title"
26
- },
27
- "initializer_range": 0.02,
28
- "intermediate_size": 3072,
29
- "label2id": {
30
- "Caption": 0,
31
- "Footnote": 1,
32
- "Formula": 2,
33
- "List-item": 3,
34
- "Page-footer": 4,
35
- "Page-header": 5,
36
- "Picture": 6,
37
- "Section-header": 7,
38
- "Table": 8,
39
- "Text": 9,
40
- "Title": 10
41
- },
42
- "layer_norm_eps": 1e-05,
43
- "max_2d_position_embeddings": 1024,
44
- "max_position_embeddings": 514,
45
- "model_type": "lilt",
46
- "num_attention_heads": 12,
47
- "num_hidden_layers": 12,
48
- "output_past": true,
49
- "pad_token_id": 1,
50
- "position_embedding_type": "absolute",
51
- "torch_dtype": "float32",
52
- "transformers_version": "4.26.1",
53
- "type_vocab_size": 1,
54
- "use_cache": true,
55
- "vocab_size": 250002
56
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-1700/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:729004fcf99456996b5021ebe5a947784fe395af38a311463a6c8394258a65e1
3
- size 2265828101
 
 
 
 
checkpoint-1700/pytorch_model.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:071823a09cad0d0ee1a84e696398cf09288e9b6d735bcc30cdd2d342f3f51d7b
3
- size 1134425553
 
 
 
 
checkpoint-1700/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:601d09199bbd913a7215c8cba0939124457c2a49e668a60ddf927eb5c0634883
3
- size 14575
 
 
 
 
checkpoint-1700/scaler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3bd9cd8c155d5657070f8ed265a80ce72d9d2060869298c24c5bdd0b74109812
3
- size 557
 
 
 
 
checkpoint-1700/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:52c3445de958aa8136571bb30deff20a540a52b3340cc380d53bac08e004773d
3
- size 627
 
 
 
 
checkpoint-1700/special_tokens_map.json DELETED
@@ -1,15 +0,0 @@
1
- {
2
- "bos_token": "<s>",
3
- "cls_token": "<s>",
4
- "eos_token": "</s>",
5
- "mask_token": {
6
- "content": "<mask>",
7
- "lstrip": true,
8
- "normalized": false,
9
- "rstrip": false,
10
- "single_word": false
11
- },
12
- "pad_token": "<pad>",
13
- "sep_token": "</s>",
14
- "unk_token": "<unk>"
15
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-1700/tokenizer.json DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:62c24cdc13d4c9952d63718d6c9fa4c287974249e16b7ade6d5a85e7bbb75626
3
- size 17082660
 
 
 
 
checkpoint-1700/tokenizer_config.json DELETED
@@ -1,20 +0,0 @@
1
- {
2
- "bos_token": "<s>",
3
- "cls_token": "<s>",
4
- "eos_token": "</s>",
5
- "mask_token": {
6
- "__type": "AddedToken",
7
- "content": "<mask>",
8
- "lstrip": true,
9
- "normalized": true,
10
- "rstrip": false,
11
- "single_word": false
12
- },
13
- "model_max_length": 512,
14
- "name_or_path": "nielsr/lilt-xlm-roberta-base",
15
- "pad_token": "<pad>",
16
- "sep_token": "</s>",
17
- "special_tokens_map_file": null,
18
- "tokenizer_class": "XLMRobertaTokenizer",
19
- "unk_token": "<unk>"
20
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-1700/trainer_state.json DELETED
@@ -1,238 +0,0 @@
1
- {
2
- "best_metric": 0.885723696687195,
3
- "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v5/checkpoint-600",
4
- "epoch": 0.906183368869936,
5
- "global_step": 1700,
6
- "is_hyper_param_search": false,
7
- "is_local_process_zero": true,
8
- "is_world_process_zero": true,
9
- "log_history": [
10
- {
11
- "epoch": 0.05,
12
- "eval_accuracy": 0.6585185702735884,
13
- "eval_f1": 0.6585185702735884,
14
- "eval_loss": 0.9875321388244629,
15
- "eval_precision": 0.6585185702735884,
16
- "eval_recall": 0.6585185702735884,
17
- "eval_runtime": 47.6616,
18
- "eval_samples_per_second": 33.717,
19
- "eval_steps_per_second": 2.119,
20
- "step": 100
21
- },
22
- {
23
- "epoch": 0.11,
24
- "eval_accuracy": 0.7551279108067913,
25
- "eval_f1": 0.7551279108067913,
26
- "eval_loss": 0.7886354327201843,
27
- "eval_precision": 0.7551279108067913,
28
- "eval_recall": 0.7551279108067913,
29
- "eval_runtime": 48.4163,
30
- "eval_samples_per_second": 33.191,
31
- "eval_steps_per_second": 2.086,
32
- "step": 200
33
- },
34
- {
35
- "epoch": 0.16,
36
- "eval_accuracy": 0.8248275724395381,
37
- "eval_f1": 0.8248275724395382,
38
- "eval_loss": 0.5894176363945007,
39
- "eval_precision": 0.8248275724395381,
40
- "eval_recall": 0.8248275724395381,
41
- "eval_runtime": 47.5388,
42
- "eval_samples_per_second": 33.804,
43
- "eval_steps_per_second": 2.125,
44
- "step": 300
45
- },
46
- {
47
- "epoch": 0.21,
48
- "eval_accuracy": 0.839579985427251,
49
- "eval_f1": 0.8395799854272509,
50
- "eval_loss": 0.479428768157959,
51
- "eval_precision": 0.839579985427251,
52
- "eval_recall": 0.839579985427251,
53
- "eval_runtime": 45.3857,
54
- "eval_samples_per_second": 35.408,
55
- "eval_steps_per_second": 2.225,
56
- "step": 400
57
- },
58
- {
59
- "epoch": 0.27,
60
- "learning_rate": 1.4712153518123668e-05,
61
- "loss": 0.7446,
62
- "step": 500
63
- },
64
- {
65
- "epoch": 0.27,
66
- "eval_accuracy": 0.870342459600547,
67
- "eval_f1": 0.8703424596005469,
68
- "eval_loss": 0.39928165078163147,
69
- "eval_precision": 0.870342459600547,
70
- "eval_recall": 0.870342459600547,
71
- "eval_runtime": 46.3389,
72
- "eval_samples_per_second": 34.679,
73
- "eval_steps_per_second": 2.18,
74
- "step": 500
75
- },
76
- {
77
- "epoch": 0.32,
78
- "eval_accuracy": 0.885723696687195,
79
- "eval_f1": 0.885723696687195,
80
- "eval_loss": 0.36305829882621765,
81
- "eval_precision": 0.885723696687195,
82
- "eval_recall": 0.885723696687195,
83
- "eval_runtime": 46.9181,
84
- "eval_samples_per_second": 34.251,
85
- "eval_steps_per_second": 2.153,
86
- "step": 600
87
- },
88
- {
89
- "epoch": 0.37,
90
- "eval_accuracy": 0.8629662531066905,
91
- "eval_f1": 0.8629662531066905,
92
- "eval_loss": 0.4096183180809021,
93
- "eval_precision": 0.8629662531066905,
94
- "eval_recall": 0.8629662531066905,
95
- "eval_runtime": 45.8414,
96
- "eval_samples_per_second": 35.056,
97
- "eval_steps_per_second": 2.203,
98
- "step": 700
99
- },
100
- {
101
- "epoch": 0.43,
102
- "eval_accuracy": 0.8528252168445007,
103
- "eval_f1": 0.8528252168445007,
104
- "eval_loss": 0.44917240738868713,
105
- "eval_precision": 0.8528252168445007,
106
- "eval_recall": 0.8528252168445007,
107
- "eval_runtime": 45.6102,
108
- "eval_samples_per_second": 35.233,
109
- "eval_steps_per_second": 2.214,
110
- "step": 800
111
- },
112
- {
113
- "epoch": 0.48,
114
- "eval_accuracy": 0.8833980456546259,
115
- "eval_f1": 0.8833980456546259,
116
- "eval_loss": 0.38389313220977783,
117
- "eval_precision": 0.8833980456546259,
118
- "eval_recall": 0.8833980456546259,
119
- "eval_runtime": 47.6493,
120
- "eval_samples_per_second": 33.726,
121
- "eval_steps_per_second": 2.12,
122
- "step": 900
123
- },
124
- {
125
- "epoch": 0.53,
126
- "learning_rate": 9.381663113006397e-06,
127
- "loss": 0.4464,
128
- "step": 1000
129
- },
130
- {
131
- "epoch": 0.53,
132
- "eval_accuracy": 0.8498407977082855,
133
- "eval_f1": 0.8498407977082856,
134
- "eval_loss": 0.4365050792694092,
135
- "eval_precision": 0.8498407977082855,
136
- "eval_recall": 0.8498407977082855,
137
- "eval_runtime": 47.0078,
138
- "eval_samples_per_second": 34.186,
139
- "eval_steps_per_second": 2.149,
140
- "step": 1000
141
- },
142
- {
143
- "epoch": 0.59,
144
- "eval_accuracy": 0.8811622266361904,
145
- "eval_f1": 0.8811622266361904,
146
- "eval_loss": 0.36158204078674316,
147
- "eval_precision": 0.8811622266361904,
148
- "eval_recall": 0.8811622266361904,
149
- "eval_runtime": 44.8724,
150
- "eval_samples_per_second": 35.813,
151
- "eval_steps_per_second": 2.251,
152
- "step": 1100
153
- },
154
- {
155
- "epoch": 0.64,
156
- "eval_accuracy": 0.8795751943864972,
157
- "eval_f1": 0.8795751943864972,
158
- "eval_loss": 0.3948919177055359,
159
- "eval_precision": 0.8795751943864972,
160
- "eval_recall": 0.8795751943864972,
161
- "eval_runtime": 45.1224,
162
- "eval_samples_per_second": 35.614,
163
- "eval_steps_per_second": 2.238,
164
- "step": 1200
165
- },
166
- {
167
- "epoch": 0.69,
168
- "eval_accuracy": 0.8612794075079601,
169
- "eval_f1": 0.8612794075079601,
170
- "eval_loss": 0.41840043663978577,
171
- "eval_precision": 0.8612794075079601,
172
- "eval_recall": 0.8612794075079601,
173
- "eval_runtime": 39.7377,
174
- "eval_samples_per_second": 40.44,
175
- "eval_steps_per_second": 2.542,
176
- "step": 1300
177
- },
178
- {
179
- "epoch": 0.75,
180
- "eval_accuracy": 0.874334993562039,
181
- "eval_f1": 0.874334993562039,
182
- "eval_loss": 0.4129931926727295,
183
- "eval_precision": 0.874334993562039,
184
- "eval_recall": 0.874334993562039,
185
- "eval_runtime": 44.8477,
186
- "eval_samples_per_second": 35.832,
187
- "eval_steps_per_second": 2.252,
188
- "step": 1400
189
- },
190
- {
191
- "epoch": 0.8,
192
- "learning_rate": 4.051172707889126e-06,
193
- "loss": 0.3672,
194
- "step": 1500
195
- },
196
- {
197
- "epoch": 0.8,
198
- "eval_accuracy": 0.8288799944104525,
199
- "eval_f1": 0.8288799944104525,
200
- "eval_loss": 0.45351940393447876,
201
- "eval_precision": 0.8288799944104525,
202
- "eval_recall": 0.8288799944104525,
203
- "eval_runtime": 45.3573,
204
- "eval_samples_per_second": 35.43,
205
- "eval_steps_per_second": 2.227,
206
- "step": 1500
207
- },
208
- {
209
- "epoch": 0.85,
210
- "eval_accuracy": 0.8712607424116902,
211
- "eval_f1": 0.8712607424116902,
212
- "eval_loss": 0.36811864376068115,
213
- "eval_precision": 0.8712607424116902,
214
- "eval_recall": 0.8712607424116902,
215
- "eval_runtime": 44.3035,
216
- "eval_samples_per_second": 36.273,
217
- "eval_steps_per_second": 2.28,
218
- "step": 1600
219
- },
220
- {
221
- "epoch": 0.91,
222
- "eval_accuracy": 0.885723696687195,
223
- "eval_f1": 0.885723696687195,
224
- "eval_loss": 0.34459415078163147,
225
- "eval_precision": 0.885723696687195,
226
- "eval_recall": 0.885723696687195,
227
- "eval_runtime": 44.6077,
228
- "eval_samples_per_second": 36.025,
229
- "eval_steps_per_second": 2.264,
230
- "step": 1700
231
- }
232
- ],
233
- "max_steps": 1876,
234
- "num_train_epochs": 1,
235
- "total_flos": 3783142448332800.0,
236
- "trial_name": null,
237
- "trial_params": null
238
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-1700/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:575d482dfbe4b5795db81627b295d36a31851f66bb801524d15bc53043f733c4
3
- size 3707
 
 
 
 
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e0ce50e2c3bc965514eb957251870b9e018aa89a1eb3c0b2d421e00f4020f51b
3
  size 1134425553
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d412db68cafdb004b544f6d25d7643b5e329556603ad90d82fa1115c4bc0a8c
3
  size 1134425553
runs/Feb15_07-53-26_e220f522c880/events.out.tfevents.1676447621.e220f522c880.495.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e10b4927301c942673e8c171300cc1481b2f2efdb1f5cf8e239edc99ad8f3db1
3
- size 13631
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:518feec74482da6cde3e3024307a9336fc4da2eb5db7da26cd3bbb4810be382c
3
+ size 13985