TimKond committed on
Commit
1840e63
·
1 Parent(s): ab0e2a3

initial commit

Browse files
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
all_results.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "eval_f1": 0.9617271835132484,
4
+ "eval_loss": 0.11346353590488434,
5
+ "eval_runtime": 12.3823,
6
+ "eval_samples_per_second": 80.761,
7
+ "eval_steps_per_second": 10.095,
8
+ "train_loss": 0.20243481533847807,
9
+ "train_runtime": 2207.1281,
10
+ "train_samples_per_second": 24.466,
11
+ "train_steps_per_second": 0.765
12
+ }
config.json ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "diffusion-detection",
3
+ "architectures": [
4
+ "BeitForImageClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.0,
7
+ "auxiliary_channels": 256,
8
+ "auxiliary_concat_input": false,
9
+ "auxiliary_loss_weight": 0.4,
10
+ "auxiliary_num_convs": 1,
11
+ "drop_path_rate": 0.1,
12
+ "hidden_act": "gelu",
13
+ "hidden_dropout_prob": 0.0,
14
+ "hidden_size": 768,
15
+ "id2label": {
16
+ "0": "negative",
17
+ "1": "positive"
18
+ },
19
+ "image_size": 224,
20
+ "initializer_range": 0.02,
21
+ "intermediate_size": 3072,
22
+ "label2id": {
23
+ "negative": "0",
24
+ "positive": "1"
25
+ },
26
+ "layer_norm_eps": 1e-12,
27
+ "layer_scale_init_value": 0.1,
28
+ "model_type": "beit",
29
+ "num_attention_heads": 12,
30
+ "num_channels": 3,
31
+ "num_hidden_layers": 12,
32
+ "out_indices": [
33
+ 3,
34
+ 5,
35
+ 7,
36
+ 11
37
+ ],
38
+ "patch_size": 16,
39
+ "pool_scales": [
40
+ 1,
41
+ 2,
42
+ 3,
43
+ 6
44
+ ],
45
+ "problem_type": "single_label_classification",
46
+ "semantic_loss_ignore_index": 255,
47
+ "torch_dtype": "float32",
48
+ "transformers_version": "4.29.2",
49
+ "use_absolute_position_embeddings": false,
50
+ "use_auxiliary_head": true,
51
+ "use_mask_token": true,
52
+ "use_mean_pooling": true,
53
+ "use_relative_position_bias": false,
54
+ "use_shared_relative_position_bias": true,
55
+ "vocab_size": 8192
56
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "eval_f1": 0.9617271835132484,
4
+ "eval_loss": 0.11346353590488434,
5
+ "eval_runtime": 12.3823,
6
+ "eval_samples_per_second": 80.761,
7
+ "eval_steps_per_second": 10.095
8
+ }
preprocessor_config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": {
3
+ "height": 224,
4
+ "width": 224
5
+ },
6
+ "do_center_crop": false,
7
+ "do_normalize": true,
8
+ "do_reduce_labels": false,
9
+ "do_rescale": true,
10
+ "do_resize": true,
11
+ "feature_extractor_type": "BeitFeatureExtractor",
12
+ "image_mean": [
13
+ 0.5,
14
+ 0.5,
15
+ 0.5
16
+ ],
17
+ "image_processor_type": "BeitImageProcessor",
18
+ "image_std": [
19
+ 0.5,
20
+ 0.5,
21
+ 0.5
22
+ ],
23
+ "resample": 2,
24
+ "rescale_factor": 0.00392156862745098,
25
+ "size": {
26
+ "height": 224,
27
+ "width": 224
28
+ }
29
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ca49ae14f393414cabd82707f498157a8a793e8cdedae766e6169edd54203b0
3
+ size 343051797
runs/Jun22_13-42-13_DESKTOP-3GG4RF1/1687434133.5090237/events.out.tfevents.1687434133.DESKTOP-3GG4RF1.16212.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d721d083565a790497d15f5ab3c97b32121d3984efdbc2b36c005e401ff0340c
3
+ size 5881
runs/Jun22_13-42-13_DESKTOP-3GG4RF1/events.out.tfevents.1687434133.DESKTOP-3GG4RF1.16212.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7c7e3567a2459ed732b97813dc4b97788e530a795db2709e2c1c324cee6e031
3
+ size 16291
runs/Jun22_13-42-13_DESKTOP-3GG4RF1/events.out.tfevents.1687436353.DESKTOP-3GG4RF1.16212.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35470df45ae1beb212aa0412e0b643e18947d6b952d809d239daf861b54e9c49
3
+ size 357
train_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "train_loss": 0.20243481533847807,
4
+ "train_runtime": 2207.1281,
5
+ "train_samples_per_second": 24.466,
6
+ "train_steps_per_second": 0.765
7
+ }
trainer_state.json ADDED
@@ -0,0 +1,352 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 3.0,
5
+ "global_step": 1689,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.0,
12
+ "learning_rate": 0.0002,
13
+ "loss": 0.7526,
14
+ "step": 1
15
+ },
16
+ {
17
+ "epoch": 0.09,
18
+ "eval_f1": 0.7867768595041322,
19
+ "eval_loss": 0.501287043094635,
20
+ "eval_runtime": 111.669,
21
+ "eval_samples_per_second": 8.955,
22
+ "eval_steps_per_second": 1.119,
23
+ "step": 48
24
+ },
25
+ {
26
+ "epoch": 0.17,
27
+ "eval_f1": 0.731527093596059,
28
+ "eval_loss": 0.45942792296409607,
29
+ "eval_runtime": 14.4836,
30
+ "eval_samples_per_second": 69.044,
31
+ "eval_steps_per_second": 8.63,
32
+ "step": 96
33
+ },
34
+ {
35
+ "epoch": 0.26,
36
+ "eval_f1": 0.768503937007874,
37
+ "eval_loss": 0.6004758477210999,
38
+ "eval_runtime": 13.7722,
39
+ "eval_samples_per_second": 72.61,
40
+ "eval_steps_per_second": 9.076,
41
+ "step": 144
42
+ },
43
+ {
44
+ "epoch": 0.34,
45
+ "eval_f1": 0.8773784355179703,
46
+ "eval_loss": 0.293561190366745,
47
+ "eval_runtime": 16.0256,
48
+ "eval_samples_per_second": 62.4,
49
+ "eval_steps_per_second": 7.8,
50
+ "step": 192
51
+ },
52
+ {
53
+ "epoch": 0.43,
54
+ "eval_f1": 0.8644444444444445,
55
+ "eval_loss": 0.3103949725627899,
56
+ "eval_runtime": 13.1537,
57
+ "eval_samples_per_second": 76.024,
58
+ "eval_steps_per_second": 9.503,
59
+ "step": 240
60
+ },
61
+ {
62
+ "epoch": 0.51,
63
+ "eval_f1": 0.903353057199211,
64
+ "eval_loss": 0.2314113825559616,
65
+ "eval_runtime": 13.9609,
66
+ "eval_samples_per_second": 71.629,
67
+ "eval_steps_per_second": 8.954,
68
+ "step": 288
69
+ },
70
+ {
71
+ "epoch": 0.6,
72
+ "eval_f1": 0.904950495049505,
73
+ "eval_loss": 0.23260511457920074,
74
+ "eval_runtime": 10.3047,
75
+ "eval_samples_per_second": 97.043,
76
+ "eval_steps_per_second": 12.13,
77
+ "step": 336
78
+ },
79
+ {
80
+ "epoch": 0.68,
81
+ "eval_f1": 0.8210526315789474,
82
+ "eval_loss": 0.39369526505470276,
83
+ "eval_runtime": 13.155,
84
+ "eval_samples_per_second": 76.017,
85
+ "eval_steps_per_second": 9.502,
86
+ "step": 384
87
+ },
88
+ {
89
+ "epoch": 0.77,
90
+ "eval_f1": 0.9147609147609148,
91
+ "eval_loss": 0.20550310611724854,
92
+ "eval_runtime": 45.6928,
93
+ "eval_samples_per_second": 21.885,
94
+ "eval_steps_per_second": 2.736,
95
+ "step": 432
96
+ },
97
+ {
98
+ "epoch": 0.85,
99
+ "eval_f1": 0.8367816091954022,
100
+ "eval_loss": 0.3017582893371582,
101
+ "eval_runtime": 22.6976,
102
+ "eval_samples_per_second": 44.057,
103
+ "eval_steps_per_second": 5.507,
104
+ "step": 480
105
+ },
106
+ {
107
+ "epoch": 0.94,
108
+ "eval_f1": 0.9271653543307087,
109
+ "eval_loss": 0.19784249365329742,
110
+ "eval_runtime": 12.076,
111
+ "eval_samples_per_second": 82.809,
112
+ "eval_steps_per_second": 10.351,
113
+ "step": 528
114
+ },
115
+ {
116
+ "epoch": 1.02,
117
+ "eval_f1": 0.9368104312938816,
118
+ "eval_loss": 0.17989766597747803,
119
+ "eval_runtime": 49.8486,
120
+ "eval_samples_per_second": 20.061,
121
+ "eval_steps_per_second": 2.508,
122
+ "step": 576
123
+ },
124
+ {
125
+ "epoch": 1.11,
126
+ "eval_f1": 0.895424836601307,
127
+ "eval_loss": 0.23422278463840485,
128
+ "eval_runtime": 11.6376,
129
+ "eval_samples_per_second": 85.928,
130
+ "eval_steps_per_second": 10.741,
131
+ "step": 624
132
+ },
133
+ {
134
+ "epoch": 1.19,
135
+ "eval_f1": 0.9256360078277887,
136
+ "eval_loss": 0.22150222957134247,
137
+ "eval_runtime": 11.4494,
138
+ "eval_samples_per_second": 87.341,
139
+ "eval_steps_per_second": 10.918,
140
+ "step": 672
141
+ },
142
+ {
143
+ "epoch": 1.28,
144
+ "eval_f1": 0.9051724137931034,
145
+ "eval_loss": 0.22654065489768982,
146
+ "eval_runtime": 11.6176,
147
+ "eval_samples_per_second": 86.076,
148
+ "eval_steps_per_second": 10.76,
149
+ "step": 720
150
+ },
151
+ {
152
+ "epoch": 1.36,
153
+ "eval_f1": 0.9389389389389389,
154
+ "eval_loss": 0.1583857387304306,
155
+ "eval_runtime": 15.3861,
156
+ "eval_samples_per_second": 64.994,
157
+ "eval_steps_per_second": 8.124,
158
+ "step": 768
159
+ },
160
+ {
161
+ "epoch": 1.45,
162
+ "eval_f1": 0.921487603305785,
163
+ "eval_loss": 0.22388193011283875,
164
+ "eval_runtime": 14.1559,
165
+ "eval_samples_per_second": 70.642,
166
+ "eval_steps_per_second": 8.83,
167
+ "step": 816
168
+ },
169
+ {
170
+ "epoch": 1.53,
171
+ "eval_f1": 0.9282868525896415,
172
+ "eval_loss": 0.1805724799633026,
173
+ "eval_runtime": 11.7527,
174
+ "eval_samples_per_second": 85.087,
175
+ "eval_steps_per_second": 10.636,
176
+ "step": 864
177
+ },
178
+ {
179
+ "epoch": 1.62,
180
+ "eval_f1": 0.8998899889988998,
181
+ "eval_loss": 0.22186490893363953,
182
+ "eval_runtime": 11.5055,
183
+ "eval_samples_per_second": 86.915,
184
+ "eval_steps_per_second": 10.864,
185
+ "step": 912
186
+ },
187
+ {
188
+ "epoch": 1.71,
189
+ "eval_f1": 0.9466263846928499,
190
+ "eval_loss": 0.15720757842063904,
191
+ "eval_runtime": 11.3153,
192
+ "eval_samples_per_second": 88.376,
193
+ "eval_steps_per_second": 11.047,
194
+ "step": 960
195
+ },
196
+ {
197
+ "epoch": 1.79,
198
+ "eval_f1": 0.9457523029682703,
199
+ "eval_loss": 0.15362103283405304,
200
+ "eval_runtime": 11.6626,
201
+ "eval_samples_per_second": 85.744,
202
+ "eval_steps_per_second": 10.718,
203
+ "step": 1008
204
+ },
205
+ {
206
+ "epoch": 1.88,
207
+ "eval_f1": 0.9403714565004888,
208
+ "eval_loss": 0.15603256225585938,
209
+ "eval_runtime": 11.4304,
210
+ "eval_samples_per_second": 87.486,
211
+ "eval_steps_per_second": 10.936,
212
+ "step": 1056
213
+ },
214
+ {
215
+ "epoch": 1.96,
216
+ "eval_f1": 0.9567901234567902,
217
+ "eval_loss": 0.13539032638072968,
218
+ "eval_runtime": 11.6426,
219
+ "eval_samples_per_second": 85.891,
220
+ "eval_steps_per_second": 10.736,
221
+ "step": 1104
222
+ },
223
+ {
224
+ "epoch": 2.0,
225
+ "learning_rate": 6.714031971580817e-05,
226
+ "loss": 0.2638,
227
+ "step": 1125
228
+ },
229
+ {
230
+ "epoch": 2.05,
231
+ "eval_f1": 0.9402390438247011,
232
+ "eval_loss": 0.2028977870941162,
233
+ "eval_runtime": 11.4905,
234
+ "eval_samples_per_second": 87.029,
235
+ "eval_steps_per_second": 10.879,
236
+ "step": 1152
237
+ },
238
+ {
239
+ "epoch": 2.13,
240
+ "eval_f1": 0.9477911646586347,
241
+ "eval_loss": 0.158633291721344,
242
+ "eval_runtime": 11.6696,
243
+ "eval_samples_per_second": 85.693,
244
+ "eval_steps_per_second": 10.712,
245
+ "step": 1200
246
+ },
247
+ {
248
+ "epoch": 2.22,
249
+ "eval_f1": 0.9363920750782065,
250
+ "eval_loss": 0.16604219377040863,
251
+ "eval_runtime": 11.6366,
252
+ "eval_samples_per_second": 85.936,
253
+ "eval_steps_per_second": 10.742,
254
+ "step": 1248
255
+ },
256
+ {
257
+ "epoch": 2.3,
258
+ "eval_f1": 0.946611909650924,
259
+ "eval_loss": 0.16741609573364258,
260
+ "eval_runtime": 11.5595,
261
+ "eval_samples_per_second": 86.509,
262
+ "eval_steps_per_second": 10.814,
263
+ "step": 1296
264
+ },
265
+ {
266
+ "epoch": 2.39,
267
+ "eval_f1": 0.9566094853683148,
268
+ "eval_loss": 0.15039804577827454,
269
+ "eval_runtime": 11.5775,
270
+ "eval_samples_per_second": 86.374,
271
+ "eval_steps_per_second": 10.797,
272
+ "step": 1344
273
+ },
274
+ {
275
+ "epoch": 2.47,
276
+ "eval_f1": 0.9386892177589852,
277
+ "eval_loss": 0.1896335780620575,
278
+ "eval_runtime": 11.4785,
279
+ "eval_samples_per_second": 87.12,
280
+ "eval_steps_per_second": 10.89,
281
+ "step": 1392
282
+ },
283
+ {
284
+ "epoch": 2.56,
285
+ "eval_f1": 0.9516129032258065,
286
+ "eval_loss": 0.1552370935678482,
287
+ "eval_runtime": 11.6346,
288
+ "eval_samples_per_second": 85.951,
289
+ "eval_steps_per_second": 10.744,
290
+ "step": 1440
291
+ },
292
+ {
293
+ "epoch": 2.64,
294
+ "eval_f1": 0.9494949494949494,
295
+ "eval_loss": 0.17198829352855682,
296
+ "eval_runtime": 11.4094,
297
+ "eval_samples_per_second": 87.647,
298
+ "eval_steps_per_second": 10.956,
299
+ "step": 1488
300
+ },
301
+ {
302
+ "epoch": 2.73,
303
+ "eval_f1": 0.9596774193548386,
304
+ "eval_loss": 0.14362381398677826,
305
+ "eval_runtime": 13.3792,
306
+ "eval_samples_per_second": 74.743,
307
+ "eval_steps_per_second": 9.343,
308
+ "step": 1536
309
+ },
310
+ {
311
+ "epoch": 2.81,
312
+ "eval_f1": 0.9530469530469531,
313
+ "eval_loss": 0.15035580098628998,
314
+ "eval_runtime": 12.9698,
315
+ "eval_samples_per_second": 77.102,
316
+ "eval_steps_per_second": 9.638,
317
+ "step": 1584
318
+ },
319
+ {
320
+ "epoch": 2.9,
321
+ "eval_f1": 0.9538461538461538,
322
+ "eval_loss": 0.1516994833946228,
323
+ "eval_runtime": 11.9429,
324
+ "eval_samples_per_second": 83.732,
325
+ "eval_steps_per_second": 10.466,
326
+ "step": 1632
327
+ },
328
+ {
329
+ "epoch": 2.98,
330
+ "eval_f1": 0.9538461538461538,
331
+ "eval_loss": 0.15105971693992615,
332
+ "eval_runtime": 13.9387,
333
+ "eval_samples_per_second": 71.743,
334
+ "eval_steps_per_second": 8.968,
335
+ "step": 1680
336
+ },
337
+ {
338
+ "epoch": 3.0,
339
+ "step": 1689,
340
+ "total_flos": 4.178103906557952e+18,
341
+ "train_loss": 0.20243481533847807,
342
+ "train_runtime": 2207.1281,
343
+ "train_samples_per_second": 24.466,
344
+ "train_steps_per_second": 0.765
345
+ }
346
+ ],
347
+ "max_steps": 1689,
348
+ "num_train_epochs": 3,
349
+ "total_flos": 4.178103906557952e+18,
350
+ "trial_name": null,
351
+ "trial_params": null
352
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a641abce807644e204c8c82075dd05c499575409b8d42ac15dc0273ce115f69
3
+ size 3887