bpdevai committed on
Commit
646d0b5
·
verified ·
1 Parent(s): 32858ce

Training in progress, epoch 5, checkpoint

Browse files
checkpoint-535/config.json CHANGED
@@ -1,69 +1,69 @@
1
- {
2
- "_name_or_path": "microsoft/conditional-detr-resnet-50",
3
- "activation_dropout": 0.0,
4
- "activation_function": "relu",
5
- "architectures": [
6
- "ConditionalDetrForObjectDetection"
7
- ],
8
- "attention_dropout": 0.0,
9
- "auxiliary_loss": false,
10
- "backbone": "resnet50",
11
- "backbone_config": null,
12
- "backbone_kwargs": {
13
- "in_chans": 3,
14
- "out_indices": [
15
- 1,
16
- 2,
17
- 3,
18
- 4
19
- ]
20
- },
21
- "bbox_cost": 5,
22
- "bbox_loss_coefficient": 5,
23
- "class_cost": 2,
24
- "cls_loss_coefficient": 2,
25
- "d_model": 256,
26
- "decoder_attention_heads": 8,
27
- "decoder_ffn_dim": 2048,
28
- "decoder_layerdrop": 0.0,
29
- "decoder_layers": 6,
30
- "dice_loss_coefficient": 1,
31
- "dilation": false,
32
- "dropout": 0.1,
33
- "encoder_attention_heads": 8,
34
- "encoder_ffn_dim": 2048,
35
- "encoder_layerdrop": 0.0,
36
- "encoder_layers": 6,
37
- "focal_alpha": 0.25,
38
- "giou_cost": 2,
39
- "giou_loss_coefficient": 2,
40
- "id2label": {
41
- "0": "Coverall",
42
- "1": "Face_Shield",
43
- "2": "Gloves",
44
- "3": "Goggles",
45
- "4": "Mask"
46
- },
47
- "init_std": 0.02,
48
- "init_xavier_std": 1.0,
49
- "is_encoder_decoder": true,
50
- "label2id": {
51
- "Coverall": 0,
52
- "Face_Shield": 1,
53
- "Gloves": 2,
54
- "Goggles": 3,
55
- "Mask": 4
56
- },
57
- "mask_loss_coefficient": 1,
58
- "max_position_embeddings": 1024,
59
- "model_type": "conditional_detr",
60
- "num_channels": 3,
61
- "num_hidden_layers": 6,
62
- "num_queries": 300,
63
- "position_embedding_type": "sine",
64
- "scale_embedding": false,
65
- "torch_dtype": "float32",
66
- "transformers_version": "4.42.0.dev0",
67
- "use_pretrained_backbone": true,
68
- "use_timm_backbone": true
69
- }
 
1
+ {
2
+ "_name_or_path": "microsoft/conditional-detr-resnet-50",
3
+ "activation_dropout": 0.0,
4
+ "activation_function": "relu",
5
+ "architectures": [
6
+ "ConditionalDetrForObjectDetection"
7
+ ],
8
+ "attention_dropout": 0.0,
9
+ "auxiliary_loss": false,
10
+ "backbone": "resnet50",
11
+ "backbone_config": null,
12
+ "backbone_kwargs": {
13
+ "in_chans": 3,
14
+ "out_indices": [
15
+ 1,
16
+ 2,
17
+ 3,
18
+ 4
19
+ ]
20
+ },
21
+ "bbox_cost": 5,
22
+ "bbox_loss_coefficient": 5,
23
+ "class_cost": 2,
24
+ "cls_loss_coefficient": 2,
25
+ "d_model": 256,
26
+ "decoder_attention_heads": 8,
27
+ "decoder_ffn_dim": 2048,
28
+ "decoder_layerdrop": 0.0,
29
+ "decoder_layers": 6,
30
+ "dice_loss_coefficient": 1,
31
+ "dilation": false,
32
+ "dropout": 0.1,
33
+ "encoder_attention_heads": 8,
34
+ "encoder_ffn_dim": 2048,
35
+ "encoder_layerdrop": 0.0,
36
+ "encoder_layers": 6,
37
+ "focal_alpha": 0.25,
38
+ "giou_cost": 2,
39
+ "giou_loss_coefficient": 2,
40
+ "id2label": {
41
+ "0": "Coverall",
42
+ "1": "Face_Shield",
43
+ "2": "Gloves",
44
+ "3": "Goggles",
45
+ "4": "Mask"
46
+ },
47
+ "init_std": 0.02,
48
+ "init_xavier_std": 1.0,
49
+ "is_encoder_decoder": true,
50
+ "label2id": {
51
+ "Coverall": 0,
52
+ "Face_Shield": 1,
53
+ "Gloves": 2,
54
+ "Goggles": 3,
55
+ "Mask": 4
56
+ },
57
+ "mask_loss_coefficient": 1,
58
+ "max_position_embeddings": 1024,
59
+ "model_type": "conditional_detr",
60
+ "num_channels": 3,
61
+ "num_hidden_layers": 6,
62
+ "num_queries": 300,
63
+ "position_embedding_type": "sine",
64
+ "scale_embedding": false,
65
+ "torch_dtype": "float32",
66
+ "transformers_version": "4.42.4",
67
+ "use_pretrained_backbone": true,
68
+ "use_timm_backbone": true
69
+ }
checkpoint-535/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8215f087a9f5bf98702b4ac5cdeaeeacbe8bd6a88141a191a846ece3c23017dd
3
  size 174079796
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7105d7eaf6c524d4c641a68ee5f123d924c0f62fa0e6e8a277009107ad117e42
3
  size 174079796
checkpoint-535/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7c347fdff918d0c20191a4a836bdace3d5278f65e88bcdd07258a29726626454
3
- size 345687577
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8111ab4a6b7a610ad51077ffc81c6ea0e44ac1925a8b5c7726b51d2fd2a499db
3
+ size 345697817
checkpoint-535/preprocessor_config.json CHANGED
@@ -1,47 +1,26 @@
1
- {
2
- "_valid_processor_keys": [
3
- "images",
4
- "annotations",
5
- "return_segmentation_masks",
6
- "masks_path",
7
- "do_resize",
8
- "size",
9
- "resample",
10
- "do_rescale",
11
- "rescale_factor",
12
- "do_normalize",
13
- "do_convert_annotations",
14
- "image_mean",
15
- "image_std",
16
- "do_pad",
17
- "pad_size",
18
- "format",
19
- "return_tensors",
20
- "data_format",
21
- "input_data_format"
22
- ],
23
- "do_convert_annotations": true,
24
- "do_normalize": true,
25
- "do_pad": false,
26
- "do_rescale": true,
27
- "do_resize": false,
28
- "format": "coco_detection",
29
- "image_mean": [
30
- 0.485,
31
- 0.456,
32
- 0.406
33
- ],
34
- "image_processor_type": "ConditionalDetrImageProcessor",
35
- "image_std": [
36
- 0.229,
37
- 0.224,
38
- 0.225
39
- ],
40
- "pad_size": null,
41
- "resample": 2,
42
- "rescale_factor": 0.00392156862745098,
43
- "size": {
44
- "longest_edge": 1333,
45
- "shortest_edge": 800
46
- }
47
- }
 
1
+ {
2
+ "do_convert_annotations": true,
3
+ "do_normalize": true,
4
+ "do_pad": false,
5
+ "do_rescale": true,
6
+ "do_resize": false,
7
+ "format": "coco_detection",
8
+ "image_mean": [
9
+ 0.485,
10
+ 0.456,
11
+ 0.406
12
+ ],
13
+ "image_processor_type": "ConditionalDetrImageProcessor",
14
+ "image_std": [
15
+ 0.229,
16
+ 0.224,
17
+ 0.225
18
+ ],
19
+ "pad_size": null,
20
+ "resample": 2,
21
+ "rescale_factor": 0.00392156862745098,
22
+ "size": {
23
+ "longest_edge": 1333,
24
+ "shortest_edge": 800
25
+ }
26
+ }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-535/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a392b92abb441aca4c13e112d8e65c63f0a787044db3944e07d73ca395700c3
3
- size 13990
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ef183d3bea4051f4f4a902fc24c80ec974ace395a2ccebcf8a75d007246f905
3
+ size 14244
checkpoint-535/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ff5026637c4bd3aa4963f3c9e1c74828911a22462e969a6ee3b6eea8b6e70288
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0885d6d5df69db7e2be573c02b967885e67d226ddcb3cf0af54d1bf50d441370
3
  size 1064
checkpoint-535/trainer_state.json CHANGED
@@ -1,340 +1,340 @@
1
- {
2
- "best_metric": 0.0041,
3
- "best_model_checkpoint": "test_detr_finetuned_cppe5/checkpoint-535",
4
- "epoch": 5.0,
5
- "eval_steps": 500,
6
- "global_step": 535,
7
- "is_hyper_param_search": false,
8
- "is_local_process_zero": true,
9
- "is_world_process_zero": true,
10
- "log_history": [
11
- {
12
- "epoch": 1.0,
13
- "step": 107,
14
- "train_loss": 3.2706406116485596,
15
- "train_map": 0.0002,
16
- "train_map_50": 0.0006,
17
- "train_map_75": 0.0001,
18
- "train_map_Coverall": 0.0007,
19
- "train_map_Face_Shield": 0.0,
20
- "train_map_Gloves": 0.0001,
21
- "train_map_Goggles": 0.0,
22
- "train_map_Mask": 0.0,
23
- "train_map_large": 0.0003,
24
- "train_map_medium": 0.0,
25
- "train_map_small": 0.0,
26
- "train_mar_1": 0.003,
27
- "train_mar_10": 0.0087,
28
- "train_mar_100": 0.0266,
29
- "train_mar_100_Coverall": 0.0956,
30
- "train_mar_100_Face_Shield": 0.0006,
31
- "train_mar_100_Gloves": 0.034,
32
- "train_mar_100_Goggles": 0.0013,
33
- "train_mar_100_Mask": 0.0016,
34
- "train_mar_large": 0.0244,
35
- "train_mar_medium": 0.0105,
36
- "train_mar_small": 0.002,
37
- "train_runtime": 75.6338,
38
- "train_samples_per_second": 11.238,
39
- "train_steps_per_second": 1.415
40
- },
41
- {
42
- "epoch": 1.0,
43
- "eval_loss": 3.281048059463501,
44
- "eval_map": 0.0001,
45
- "eval_map_50": 0.0005,
46
- "eval_map_75": 0.0,
47
- "eval_map_Coverall": 0.0005,
48
- "eval_map_Face_Shield": 0.0,
49
- "eval_map_Gloves": 0.0001,
50
- "eval_map_Goggles": 0.0,
51
- "eval_map_Mask": 0.0,
52
- "eval_map_large": 0.0002,
53
- "eval_map_medium": 0.0001,
54
- "eval_map_small": 0.0001,
55
- "eval_mar_1": 0.002,
56
- "eval_mar_10": 0.0057,
57
- "eval_mar_100": 0.0185,
58
- "eval_mar_100_Coverall": 0.0676,
59
- "eval_mar_100_Face_Shield": 0.0,
60
- "eval_mar_100_Gloves": 0.0246,
61
- "eval_mar_100_Goggles": 0.0,
62
- "eval_mar_100_Mask": 0.0004,
63
- "eval_mar_large": 0.0155,
64
- "eval_mar_medium": 0.0078,
65
- "eval_mar_small": 0.0027,
66
- "eval_runtime": 41.9051,
67
- "eval_samples_per_second": 3.58,
68
- "eval_steps_per_second": 0.453,
69
- "step": 107
70
- },
71
- {
72
- "epoch": 2.0,
73
- "step": 214,
74
- "train_loss": 3.312178373336792,
75
- "train_map": 0.0021,
76
- "train_map_50": 0.0092,
77
- "train_map_75": 0.0002,
78
- "train_map_Coverall": 0.0106,
79
- "train_map_Face_Shield": 0.0,
80
- "train_map_Gloves": 0.0,
81
- "train_map_Goggles": 0.0,
82
- "train_map_Mask": 0.0001,
83
- "train_map_large": 0.0023,
84
- "train_map_medium": 0.0001,
85
- "train_map_small": 0.0001,
86
- "train_mar_1": 0.0084,
87
- "train_mar_10": 0.0299,
88
- "train_mar_100": 0.0442,
89
- "train_mar_100_Coverall": 0.2058,
90
- "train_mar_100_Face_Shield": 0.0,
91
- "train_mar_100_Gloves": 0.015,
92
- "train_mar_100_Goggles": 0.0,
93
- "train_mar_100_Mask": 0.0001,
94
- "train_mar_large": 0.0452,
95
- "train_mar_medium": 0.0064,
96
- "train_mar_small": 0.0003,
97
- "train_runtime": 71.4629,
98
- "train_samples_per_second": 11.894,
99
- "train_steps_per_second": 1.497
100
- },
101
- {
102
- "epoch": 2.0,
103
- "eval_loss": 3.3038530349731445,
104
- "eval_map": 0.002,
105
- "eval_map_50": 0.0085,
106
- "eval_map_75": 0.0002,
107
- "eval_map_Coverall": 0.0098,
108
- "eval_map_Face_Shield": 0.0,
109
- "eval_map_Gloves": 0.0,
110
- "eval_map_Goggles": 0.0,
111
- "eval_map_Mask": 0.0,
112
- "eval_map_large": 0.0023,
113
- "eval_map_medium": 0.0,
114
- "eval_map_small": 0.0002,
115
- "eval_mar_1": 0.0058,
116
- "eval_mar_10": 0.0224,
117
- "eval_mar_100": 0.0351,
118
- "eval_mar_100_Coverall": 0.1644,
119
- "eval_mar_100_Face_Shield": 0.0,
120
- "eval_mar_100_Gloves": 0.0112,
121
- "eval_mar_100_Goggles": 0.0,
122
- "eval_mar_100_Mask": 0.0,
123
- "eval_mar_large": 0.0373,
124
- "eval_mar_medium": 0.006,
125
- "eval_mar_small": 0.0005,
126
- "eval_runtime": 36.9767,
127
- "eval_samples_per_second": 4.057,
128
- "eval_steps_per_second": 0.514,
129
- "step": 214
130
- },
131
- {
132
- "epoch": 3.0,
133
- "step": 321,
134
- "train_loss": 3.66046404838562,
135
- "train_map": 0.0004,
136
- "train_map_50": 0.0022,
137
- "train_map_75": 0.0,
138
- "train_map_Coverall": 0.0018,
139
- "train_map_Face_Shield": 0.0,
140
- "train_map_Gloves": 0.0,
141
- "train_map_Goggles": 0.0,
142
- "train_map_Mask": 0.0,
143
- "train_map_large": 0.0004,
144
- "train_map_medium": 0.0,
145
- "train_map_small": 0.0002,
146
- "train_mar_1": 0.0025,
147
- "train_mar_10": 0.0094,
148
- "train_mar_100": 0.0171,
149
- "train_mar_100_Coverall": 0.0597,
150
- "train_mar_100_Face_Shield": 0.0,
151
- "train_mar_100_Gloves": 0.0,
152
- "train_mar_100_Goggles": 0.0,
153
- "train_mar_100_Mask": 0.0259,
154
- "train_mar_large": 0.0126,
155
- "train_mar_medium": 0.0095,
156
- "train_mar_small": 0.0002,
157
- "train_runtime": 71.7786,
158
- "train_samples_per_second": 11.842,
159
- "train_steps_per_second": 1.491
160
- },
161
- {
162
- "epoch": 3.0,
163
- "eval_loss": 3.6040291786193848,
164
- "eval_map": 0.0007,
165
- "eval_map_50": 0.0032,
166
- "eval_map_75": 0.0,
167
- "eval_map_Coverall": 0.0035,
168
- "eval_map_Face_Shield": 0.0,
169
- "eval_map_Gloves": 0.0,
170
- "eval_map_Goggles": 0.0,
171
- "eval_map_Mask": 0.0,
172
- "eval_map_large": 0.0007,
173
- "eval_map_medium": 0.0,
174
- "eval_map_small": 0.0,
175
- "eval_mar_1": 0.0017,
176
- "eval_mar_10": 0.0077,
177
- "eval_mar_100": 0.0126,
178
- "eval_mar_100_Coverall": 0.0486,
179
- "eval_mar_100_Face_Shield": 0.0,
180
- "eval_mar_100_Gloves": 0.0,
181
- "eval_mar_100_Goggles": 0.0,
182
- "eval_mar_100_Mask": 0.0142,
183
- "eval_mar_large": 0.0111,
184
- "eval_mar_medium": 0.007,
185
- "eval_mar_small": 0.0,
186
- "eval_runtime": 36.2619,
187
- "eval_samples_per_second": 4.137,
188
- "eval_steps_per_second": 0.524,
189
- "step": 321
190
- },
191
- {
192
- "epoch": 4.0,
193
- "step": 428,
194
- "train_loss": 3.2305893898010254,
195
- "train_map": 0.001,
196
- "train_map_50": 0.0041,
197
- "train_map_75": 0.0001,
198
- "train_map_Coverall": 0.0052,
199
- "train_map_Face_Shield": 0.0,
200
- "train_map_Gloves": 0.0,
201
- "train_map_Goggles": 0.0,
202
- "train_map_Mask": 0.0,
203
- "train_map_large": 0.0011,
204
- "train_map_medium": 0.0,
205
- "train_map_small": 0.0004,
206
- "train_mar_1": 0.0027,
207
- "train_mar_10": 0.0234,
208
- "train_mar_100": 0.054,
209
- "train_mar_100_Coverall": 0.2667,
210
- "train_mar_100_Face_Shield": 0.0,
211
- "train_mar_100_Gloves": 0.0025,
212
- "train_mar_100_Goggles": 0.0,
213
- "train_mar_100_Mask": 0.0008,
214
- "train_mar_large": 0.0563,
215
- "train_mar_medium": 0.001,
216
- "train_mar_small": 0.0001,
217
- "train_runtime": 68.5556,
218
- "train_samples_per_second": 12.399,
219
- "train_steps_per_second": 1.561
220
- },
221
- {
222
- "epoch": 4.0,
223
- "eval_loss": 3.286728858947754,
224
- "eval_map": 0.0006,
225
- "eval_map_50": 0.0028,
226
- "eval_map_75": 0.0001,
227
- "eval_map_Coverall": 0.0032,
228
- "eval_map_Face_Shield": 0.0,
229
- "eval_map_Gloves": 0.0,
230
- "eval_map_Goggles": 0.0,
231
- "eval_map_Mask": 0.0,
232
- "eval_map_large": 0.0007,
233
- "eval_map_medium": 0.0,
234
- "eval_map_small": 0.0,
235
- "eval_mar_1": 0.0016,
236
- "eval_mar_10": 0.0152,
237
- "eval_mar_100": 0.0368,
238
- "eval_mar_100_Coverall": 0.1833,
239
- "eval_mar_100_Face_Shield": 0.0,
240
- "eval_mar_100_Gloves": 0.0004,
241
- "eval_mar_100_Goggles": 0.0,
242
- "eval_mar_100_Mask": 0.0004,
243
- "eval_mar_large": 0.042,
244
- "eval_mar_medium": 0.0004,
245
- "eval_mar_small": 0.0,
246
- "eval_runtime": 35.94,
247
- "eval_samples_per_second": 4.174,
248
- "eval_steps_per_second": 0.529,
249
- "step": 428
250
- },
251
- {
252
- "epoch": 4.672897196261682,
253
- "grad_norm": 96.62178802490234,
254
- "learning_rate": 4.97310930008156e-05,
255
- "loss": 5.244,
256
- "step": 500
257
- },
258
- {
259
- "epoch": 5.0,
260
- "step": 535,
261
- "train_loss": 3.113837957382202,
262
- "train_map": 0.0047,
263
- "train_map_50": 0.0141,
264
- "train_map_75": 0.0021,
265
- "train_map_Coverall": 0.0236,
266
- "train_map_Face_Shield": 0.0,
267
- "train_map_Gloves": 0.0,
268
- "train_map_Goggles": 0.0,
269
- "train_map_Mask": 0.0,
270
- "train_map_large": 0.005,
271
- "train_map_medium": 0.0,
272
- "train_map_small": 0.0,
273
- "train_mar_1": 0.0147,
274
- "train_mar_10": 0.0356,
275
- "train_mar_100": 0.0795,
276
- "train_mar_100_Coverall": 0.3905,
277
- "train_mar_100_Face_Shield": 0.0,
278
- "train_mar_100_Gloves": 0.0061,
279
- "train_mar_100_Goggles": 0.0,
280
- "train_mar_100_Mask": 0.0007,
281
- "train_mar_large": 0.0824,
282
- "train_mar_medium": 0.0023,
283
- "train_mar_small": 0.0,
284
- "train_runtime": 69.5355,
285
- "train_samples_per_second": 12.224,
286
- "train_steps_per_second": 1.539
287
- },
288
- {
289
- "epoch": 5.0,
290
- "eval_loss": 3.183504581451416,
291
- "eval_map": 0.0041,
292
- "eval_map_50": 0.0123,
293
- "eval_map_75": 0.0031,
294
- "eval_map_Coverall": 0.0203,
295
- "eval_map_Face_Shield": 0.0,
296
- "eval_map_Gloves": 0.0,
297
- "eval_map_Goggles": 0.0,
298
- "eval_map_Mask": 0.0,
299
- "eval_map_large": 0.0046,
300
- "eval_map_medium": 0.0,
301
- "eval_map_small": 0.0,
302
- "eval_mar_1": 0.0092,
303
- "eval_mar_10": 0.0232,
304
- "eval_mar_100": 0.0572,
305
- "eval_mar_100_Coverall": 0.2829,
306
- "eval_mar_100_Face_Shield": 0.0,
307
- "eval_mar_100_Gloves": 0.0031,
308
- "eval_mar_100_Goggles": 0.0,
309
- "eval_mar_100_Mask": 0.0,
310
- "eval_mar_large": 0.0647,
311
- "eval_mar_medium": 0.0012,
312
- "eval_mar_small": 0.0,
313
- "eval_runtime": 36.8768,
314
- "eval_samples_per_second": 4.068,
315
- "eval_steps_per_second": 0.515,
316
- "step": 535
317
- }
318
- ],
319
- "logging_steps": 500,
320
- "max_steps": 10700,
321
- "num_input_tokens_seen": 0,
322
- "num_train_epochs": 100,
323
- "save_steps": 500,
324
- "stateful_callbacks": {
325
- "TrainerControl": {
326
- "args": {
327
- "should_epoch_stop": false,
328
- "should_evaluate": false,
329
- "should_log": false,
330
- "should_save": true,
331
- "should_training_stop": false
332
- },
333
- "attributes": {}
334
- }
335
- },
336
- "total_flos": 7.635321615744e+17,
337
- "train_batch_size": 8,
338
- "trial_name": null,
339
- "trial_params": null
340
- }
 
1
+ {
2
+ "best_metric": 0.122,
3
+ "best_model_checkpoint": "test_detr_finetuned_cppe5\\checkpoint-535",
4
+ "epoch": 5.0,
5
+ "eval_steps": 500,
6
+ "global_step": 535,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "step": 107,
14
+ "train_loss": 2.531707286834717,
15
+ "train_map": 0.0033,
16
+ "train_map_50": 0.0117,
17
+ "train_map_75": 0.0011,
18
+ "train_map_Coverall": 0.0032,
19
+ "train_map_Face_Shield": 0.0001,
20
+ "train_map_Gloves": 0.0049,
21
+ "train_map_Goggles": 0.0,
22
+ "train_map_Mask": 0.0081,
23
+ "train_map_large": 0.0063,
24
+ "train_map_medium": 0.0037,
25
+ "train_map_small": 0.0017,
26
+ "train_mar_1": 0.0094,
27
+ "train_mar_10": 0.0727,
28
+ "train_mar_100": 0.1382,
29
+ "train_mar_100_Coverall": 0.2272,
30
+ "train_mar_100_Face_Shield": 0.0201,
31
+ "train_mar_100_Gloves": 0.199,
32
+ "train_mar_100_Goggles": 0.0,
33
+ "train_mar_100_Mask": 0.2445,
34
+ "train_mar_large": 0.0983,
35
+ "train_mar_medium": 0.1363,
36
+ "train_mar_small": 0.0346,
37
+ "train_runtime": 29.266,
38
+ "train_samples_per_second": 29.044,
39
+ "train_steps_per_second": 3.656
40
+ },
41
+ {
42
+ "epoch": 1.0,
43
+ "eval_loss": 2.618133068084717,
44
+ "eval_map": 0.0023,
45
+ "eval_map_50": 0.0084,
46
+ "eval_map_75": 0.0006,
47
+ "eval_map_Coverall": 0.0025,
48
+ "eval_map_Face_Shield": 0.0002,
49
+ "eval_map_Gloves": 0.0026,
50
+ "eval_map_Goggles": 0.0,
51
+ "eval_map_Mask": 0.0062,
52
+ "eval_map_large": 0.0075,
53
+ "eval_map_medium": 0.0029,
54
+ "eval_map_small": 0.0019,
55
+ "eval_mar_1": 0.0082,
56
+ "eval_mar_10": 0.0496,
57
+ "eval_mar_100": 0.1009,
58
+ "eval_mar_100_Coverall": 0.1667,
59
+ "eval_mar_100_Face_Shield": 0.0152,
60
+ "eval_mar_100_Gloves": 0.1442,
61
+ "eval_mar_100_Goggles": 0.0,
62
+ "eval_mar_100_Mask": 0.1782,
63
+ "eval_mar_large": 0.1089,
64
+ "eval_mar_medium": 0.1196,
65
+ "eval_mar_small": 0.0338,
66
+ "eval_runtime": 10.5496,
67
+ "eval_samples_per_second": 14.218,
68
+ "eval_steps_per_second": 1.801,
69
+ "step": 107
70
+ },
71
+ {
72
+ "epoch": 2.0,
73
+ "step": 214,
74
+ "train_loss": 2.1007583141326904,
75
+ "train_map": 0.0405,
76
+ "train_map_50": 0.0973,
77
+ "train_map_75": 0.0262,
78
+ "train_map_Coverall": 0.0862,
79
+ "train_map_Face_Shield": 0.0034,
80
+ "train_map_Gloves": 0.0161,
81
+ "train_map_Goggles": 0.0014,
82
+ "train_map_Mask": 0.0954,
83
+ "train_map_large": 0.0499,
84
+ "train_map_medium": 0.0351,
85
+ "train_map_small": 0.0156,
86
+ "train_mar_1": 0.1017,
87
+ "train_mar_10": 0.2491,
88
+ "train_mar_100": 0.2902,
89
+ "train_mar_100_Coverall": 0.5555,
90
+ "train_mar_100_Face_Shield": 0.1718,
91
+ "train_mar_100_Gloves": 0.2798,
92
+ "train_mar_100_Goggles": 0.0571,
93
+ "train_mar_100_Mask": 0.3865,
94
+ "train_mar_large": 0.2549,
95
+ "train_mar_medium": 0.2432,
96
+ "train_mar_small": 0.1161,
97
+ "train_runtime": 26.5597,
98
+ "train_samples_per_second": 32.003,
99
+ "train_steps_per_second": 4.029
100
+ },
101
+ {
102
+ "epoch": 2.0,
103
+ "eval_loss": 2.251506805419922,
104
+ "eval_map": 0.0386,
105
+ "eval_map_50": 0.0946,
106
+ "eval_map_75": 0.0261,
107
+ "eval_map_Coverall": 0.1234,
108
+ "eval_map_Face_Shield": 0.005,
109
+ "eval_map_Gloves": 0.0102,
110
+ "eval_map_Goggles": 0.0011,
111
+ "eval_map_Mask": 0.0531,
112
+ "eval_map_large": 0.0645,
113
+ "eval_map_medium": 0.0251,
114
+ "eval_map_small": 0.0109,
115
+ "eval_mar_1": 0.0744,
116
+ "eval_mar_10": 0.1938,
117
+ "eval_mar_100": 0.2324,
118
+ "eval_mar_100_Coverall": 0.4653,
119
+ "eval_mar_100_Face_Shield": 0.1722,
120
+ "eval_mar_100_Gloves": 0.2165,
121
+ "eval_mar_100_Goggles": 0.0277,
122
+ "eval_mar_100_Mask": 0.2804,
123
+ "eval_mar_large": 0.3155,
124
+ "eval_mar_medium": 0.2153,
125
+ "eval_mar_small": 0.0878,
126
+ "eval_runtime": 9.8776,
127
+ "eval_samples_per_second": 15.186,
128
+ "eval_steps_per_second": 1.924,
129
+ "step": 214
130
+ },
131
+ {
132
+ "epoch": 3.0,
133
+ "step": 321,
134
+ "train_loss": 1.8027496337890625,
135
+ "train_map": 0.0689,
136
+ "train_map_50": 0.1515,
137
+ "train_map_75": 0.053,
138
+ "train_map_Coverall": 0.1899,
139
+ "train_map_Face_Shield": 0.0098,
140
+ "train_map_Gloves": 0.0287,
141
+ "train_map_Goggles": 0.0123,
142
+ "train_map_Mask": 0.104,
143
+ "train_map_large": 0.0958,
144
+ "train_map_medium": 0.0492,
145
+ "train_map_small": 0.0201,
146
+ "train_mar_1": 0.1643,
147
+ "train_mar_10": 0.3427,
148
+ "train_mar_100": 0.3901,
149
+ "train_mar_100_Coverall": 0.6673,
150
+ "train_mar_100_Face_Shield": 0.3124,
151
+ "train_mar_100_Gloves": 0.3556,
152
+ "train_mar_100_Goggles": 0.2114,
153
+ "train_mar_100_Mask": 0.4038,
154
+ "train_mar_large": 0.4421,
155
+ "train_mar_medium": 0.3085,
156
+ "train_mar_small": 0.1399,
157
+ "train_runtime": 25.8607,
158
+ "train_samples_per_second": 32.868,
159
+ "train_steps_per_second": 4.138
160
+ },
161
+ {
162
+ "epoch": 3.0,
163
+ "eval_loss": 1.9757874011993408,
164
+ "eval_map": 0.0539,
165
+ "eval_map_50": 0.1302,
166
+ "eval_map_75": 0.0411,
167
+ "eval_map_Coverall": 0.1643,
168
+ "eval_map_Face_Shield": 0.0092,
169
+ "eval_map_Gloves": 0.0261,
170
+ "eval_map_Goggles": 0.0098,
171
+ "eval_map_Mask": 0.0601,
172
+ "eval_map_large": 0.1194,
173
+ "eval_map_medium": 0.0401,
174
+ "eval_map_small": 0.0231,
175
+ "eval_mar_1": 0.1144,
176
+ "eval_mar_10": 0.2597,
177
+ "eval_mar_100": 0.304,
178
+ "eval_mar_100_Coverall": 0.5284,
179
+ "eval_mar_100_Face_Shield": 0.243,
180
+ "eval_mar_100_Gloves": 0.2942,
181
+ "eval_mar_100_Goggles": 0.1446,
182
+ "eval_mar_100_Mask": 0.3098,
183
+ "eval_mar_large": 0.4992,
184
+ "eval_mar_medium": 0.259,
185
+ "eval_mar_small": 0.1355,
186
+ "eval_runtime": 9.6967,
187
+ "eval_samples_per_second": 15.469,
188
+ "eval_steps_per_second": 1.959,
189
+ "step": 321
190
+ },
191
+ {
192
+ "epoch": 4.0,
193
+ "step": 428,
194
+ "train_loss": 1.6371513605117798,
195
+ "train_map": 0.1256,
196
+ "train_map_50": 0.2579,
197
+ "train_map_75": 0.1074,
198
+ "train_map_Coverall": 0.3276,
199
+ "train_map_Face_Shield": 0.0195,
200
+ "train_map_Gloves": 0.0689,
201
+ "train_map_Goggles": 0.0266,
202
+ "train_map_Mask": 0.1852,
203
+ "train_map_large": 0.1425,
204
+ "train_map_medium": 0.094,
205
+ "train_map_small": 0.0312,
206
+ "train_mar_1": 0.2065,
207
+ "train_mar_10": 0.4048,
208
+ "train_mar_100": 0.4399,
209
+ "train_mar_100_Coverall": 0.7245,
210
+ "train_mar_100_Face_Shield": 0.3362,
211
+ "train_mar_100_Gloves": 0.3539,
212
+ "train_mar_100_Goggles": 0.3075,
213
+ "train_mar_100_Mask": 0.4775,
214
+ "train_mar_large": 0.5627,
215
+ "train_mar_medium": 0.3551,
216
+ "train_mar_small": 0.1666,
217
+ "train_runtime": 29.1332,
218
+ "train_samples_per_second": 29.176,
219
+ "train_steps_per_second": 3.673
220
+ },
221
+ {
222
+ "epoch": 4.0,
223
+ "eval_loss": 1.8584269285202026,
224
+ "eval_map": 0.0933,
225
+ "eval_map_50": 0.2047,
226
+ "eval_map_75": 0.0782,
227
+ "eval_map_Coverall": 0.2757,
228
+ "eval_map_Face_Shield": 0.0127,
229
+ "eval_map_Gloves": 0.04,
230
+ "eval_map_Goggles": 0.0208,
231
+ "eval_map_Mask": 0.1173,
232
+ "eval_map_large": 0.1536,
233
+ "eval_map_medium": 0.0659,
234
+ "eval_map_small": 0.0271,
235
+ "eval_mar_1": 0.1454,
236
+ "eval_mar_10": 0.3083,
237
+ "eval_mar_100": 0.3419,
238
+ "eval_mar_100_Coverall": 0.605,
239
+ "eval_mar_100_Face_Shield": 0.2519,
240
+ "eval_mar_100_Gloves": 0.2763,
241
+ "eval_mar_100_Goggles": 0.2354,
242
+ "eval_mar_100_Mask": 0.3409,
243
+ "eval_mar_large": 0.5593,
244
+ "eval_mar_medium": 0.2956,
245
+ "eval_mar_small": 0.1551,
246
+ "eval_runtime": 11.7158,
247
+ "eval_samples_per_second": 12.803,
248
+ "eval_steps_per_second": 1.622,
249
+ "step": 428
250
+ },
251
+ {
252
+ "epoch": 4.672897196261682,
253
+ "grad_norm": 17.656822204589844,
254
+ "learning_rate": 4.97310930008156e-05,
255
+ "loss": 4.0731,
256
+ "step": 500
257
+ },
258
+ {
259
+ "epoch": 5.0,
260
+ "step": 535,
261
+ "train_loss": 1.5120447874069214,
262
+ "train_map": 0.1712,
263
+ "train_map_50": 0.3563,
264
+ "train_map_75": 0.1466,
265
+ "train_map_Coverall": 0.4435,
266
+ "train_map_Face_Shield": 0.0746,
267
+ "train_map_Gloves": 0.0904,
268
+ "train_map_Goggles": 0.0174,
269
+ "train_map_Mask": 0.2302,
270
+ "train_map_large": 0.2072,
271
+ "train_map_medium": 0.1168,
272
+ "train_map_small": 0.0514,
273
+ "train_mar_1": 0.2393,
274
+ "train_mar_10": 0.4484,
275
+ "train_mar_100": 0.4809,
276
+ "train_mar_100_Coverall": 0.7121,
277
+ "train_mar_100_Face_Shield": 0.4876,
278
+ "train_mar_100_Gloves": 0.4058,
279
+ "train_mar_100_Goggles": 0.301,
280
+ "train_mar_100_Mask": 0.4979,
281
+ "train_mar_large": 0.6526,
282
+ "train_mar_medium": 0.394,
283
+ "train_mar_small": 0.2152,
284
+ "train_runtime": 25.2419,
285
+ "train_samples_per_second": 33.674,
286
+ "train_steps_per_second": 4.239
287
+ },
288
+ {
289
+ "epoch": 5.0,
290
+ "eval_loss": 1.7863460779190063,
291
+ "eval_map": 0.122,
292
+ "eval_map_50": 0.266,
293
+ "eval_map_75": 0.107,
294
+ "eval_map_Coverall": 0.3757,
295
+ "eval_map_Face_Shield": 0.047,
296
+ "eval_map_Gloves": 0.0488,
297
+ "eval_map_Goggles": 0.0105,
298
+ "eval_map_Mask": 0.1283,
299
+ "eval_map_large": 0.218,
300
+ "eval_map_medium": 0.0869,
301
+ "eval_map_small": 0.0417,
302
+ "eval_mar_1": 0.175,
303
+ "eval_mar_10": 0.3379,
304
+ "eval_mar_100": 0.3696,
305
+ "eval_mar_100_Coverall": 0.6068,
306
+ "eval_mar_100_Face_Shield": 0.4089,
307
+ "eval_mar_100_Gloves": 0.2759,
308
+ "eval_mar_100_Goggles": 0.2138,
309
+ "eval_mar_100_Mask": 0.3427,
310
+ "eval_mar_large": 0.6453,
311
+ "eval_mar_medium": 0.328,
312
+ "eval_mar_small": 0.1947,
313
+ "eval_runtime": 9.6261,
314
+ "eval_samples_per_second": 15.583,
315
+ "eval_steps_per_second": 1.974,
316
+ "step": 535
317
+ }
318
+ ],
319
+ "logging_steps": 500,
320
+ "max_steps": 10700,
321
+ "num_input_tokens_seen": 0,
322
+ "num_train_epochs": 100,
323
+ "save_steps": 500,
324
+ "stateful_callbacks": {
325
+ "TrainerControl": {
326
+ "args": {
327
+ "should_epoch_stop": false,
328
+ "should_evaluate": false,
329
+ "should_log": false,
330
+ "should_save": true,
331
+ "should_training_stop": false
332
+ },
333
+ "attributes": {}
334
+ }
335
+ },
336
+ "total_flos": 7.635321615744e+17,
337
+ "train_batch_size": 8,
338
+ "trial_name": null,
339
+ "trial_params": null
340
+ }
checkpoint-535/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70ab6612c795f2330a136ddf97d7c6e0ba7798175cc9cae994cc3f067700c650
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aed3eb8d6db83a01a4da94998232d2b334cd1e141aeaa94f3c5559fdda758c8e
3
  size 5176