LightningNO1 committed on
Commit
4c86dc8
·
verified ·
1 Parent(s): 6f8d140

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ ss_100base/step1/metrics.json filter=lfs diff=lfs merge=lfs -text
ps_100base/step1/config.yaml ADDED
@@ -0,0 +1,454 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ CONT:
2
+ ADD_POS: false
3
+ BASE_CLS: 100
4
+ COLLECT_QUERY_MODE: false
5
+ COMBINE_PSDLABEL: false
6
+ CUMULATIVE_PSDNUM: false
7
+ DISTRIBUTION_ALPHA: 0.5
8
+ FILTER_KD: false
9
+ FREEZE_LABEL: false
10
+ INC_CLS: 5
11
+ KD_DECODER: true
12
+ KD_TEMPERATURE: 1.0
13
+ KD_TEMPERATURE2: 1.0
14
+ KD_TYPE: kl
15
+ KL_ALL: true
16
+ KL_WEIGHT: 2.0
17
+ LIB_SIZE: 80
18
+ MED_TOKENS_WEIGHT: 5.0
19
+ MEMORY: false
20
+ MPATH: memory/pan
21
+ OLD_MODEL: true
22
+ OLD_WEIGHTS: null
23
+ PSD_LABEL_THRESHOLD: 0.35
24
+ PSD_OVERLAP_THRESHOLD: 0.8
25
+ SETTING: overlapped
26
+ TASK: 1
27
+ TOT_CLS: 150
28
+ VQ_NUMBER: 3
29
+ VQ_STORE: false
30
+ WEIGHTED_SAMPLE: true
31
+ WEIGHTS: null
32
+ CUDNN_BENCHMARK: false
33
+ DATALOADER:
34
+ ASPECT_RATIO_GROUPING: true
35
+ FILTER_EMPTY_ANNOTATIONS: true
36
+ NUM_WORKERS: 2
37
+ REPEAT_SQRT: true
38
+ REPEAT_THRESHOLD: 0.0
39
+ SAMPLER_TRAIN: TrainingSampler
40
+ DATASETS:
41
+ PRECOMPUTED_PROPOSAL_TOPK_TEST: 1000
42
+ PRECOMPUTED_PROPOSAL_TOPK_TRAIN: 2000
43
+ PROPOSAL_FILES_TEST: []
44
+ PROPOSAL_FILES_TRAIN: []
45
+ TEST:
46
+ - current_ade20k_panoptic_val
47
+ TRAIN:
48
+ - current_ade20k_panoptic_train
49
+ GLOBAL:
50
+ HACK: 1.0
51
+ INPUT:
52
+ COLOR_AUG_SSD: true
53
+ CROP:
54
+ ENABLED: true
55
+ SINGLE_CATEGORY_MAX_AREA: 1.0
56
+ SIZE:
57
+ - 640
58
+ - 640
59
+ TYPE: absolute
60
+ DATASET_MAPPER_NAME: continual_panoptic
61
+ FORMAT: RGB
62
+ IMAGE_SIZE: 1024
63
+ MASK_FORMAT: polygon
64
+ MAX_SCALE: 2.0
65
+ MAX_SIZE_TEST: 2560
66
+ MAX_SIZE_TRAIN: 2560
67
+ MIN_SCALE: 0.1
68
+ MIN_SIZE_TEST: 640
69
+ MIN_SIZE_TRAIN:
70
+ - 320
71
+ - 384
72
+ - 448
73
+ - 512
74
+ - 576
75
+ - 640
76
+ - 704
77
+ - 768
78
+ - 832
79
+ - 896
80
+ - 960
81
+ - 1024
82
+ - 1088
83
+ - 1152
84
+ - 1216
85
+ - 1280
86
+ MIN_SIZE_TRAIN_SAMPLING: choice
87
+ RANDOM_FLIP: horizontal
88
+ SIZE_DIVISIBILITY: 640
89
+ MODEL:
90
+ ANCHOR_GENERATOR:
91
+ ANGLES:
92
+ - - -90
93
+ - 0
94
+ - 90
95
+ ASPECT_RATIOS:
96
+ - - 0.5
97
+ - 1.0
98
+ - 2.0
99
+ NAME: DefaultAnchorGenerator
100
+ OFFSET: 0.0
101
+ SIZES:
102
+ - - 32
103
+ - 64
104
+ - 128
105
+ - 256
106
+ - 512
107
+ BACKBONE:
108
+ FREEZE_AT: 0
109
+ NAME: build_resnet_backbone
110
+ DEVICE: cuda
111
+ FPN:
112
+ FUSE_TYPE: sum
113
+ IN_FEATURES: []
114
+ NORM: ''
115
+ OUT_CHANNELS: 256
116
+ KEYPOINT_ON: false
117
+ LOAD_PROPOSALS: false
118
+ MASK_FORMER:
119
+ CLASS_WEIGHT: 4.0
120
+ CLIP_DIM: 768
121
+ DEC_LAYERS: 10
122
+ DEEP_SUPERVISION: true
123
+ DICE_WEIGHT: 5.0
124
+ DIM_FEEDFORWARD: 2048
125
+ DROPOUT: 0.0
126
+ ENC_LAYERS: 0
127
+ ENFORCE_INPUT_PROJ: false
128
+ HIDDEN_DIM: 256
129
+ IMPORTANCE_SAMPLE_RATIO: 0.75
130
+ MASK_WEIGHT: 5.0
131
+ NHEADS: 8
132
+ NO_OBJECT_WEIGHT: 0.1
133
+ NUM_OBJECT_QUERIES: 100
134
+ OVERSAMPLE_RATIO: 3.0
135
+ PRE_NORM: false
136
+ SIZE_DIVISIBILITY: 32
137
+ TEST:
138
+ INSTANCE_ON: true
139
+ OBJECT_MASK_THRESHOLD: 0.25
140
+ OVERLAP_THRESHOLD: 0.8
141
+ PANOPTIC_ON: true
142
+ SEMANTIC_ON: true
143
+ SEM_SEG_POSTPROCESSING_BEFORE_INFERENCE: false
144
+ TEXT_PATH: label_embedding/ade20k_150_laion768_all.npy
145
+ TRAIN_NUM_POINTS: 12544
146
+ TRANSFORMER_DECODER_NAME: MultiScaleMaskedTransformerDecoder
147
+ TRANSFORMER_IN_FEATURE: multi_scale_pixel_decoder
148
+ USE_TEXT_EMBEDDING: false
149
+ MASK_ON: false
150
+ META_ARCHITECTURE: MaskFormer
151
+ PANOPTIC_FPN:
152
+ COMBINE:
153
+ ENABLED: true
154
+ INSTANCES_CONFIDENCE_THRESH: 0.5
155
+ OVERLAP_THRESH: 0.5
156
+ STUFF_AREA_LIMIT: 4096
157
+ INSTANCE_LOSS_WEIGHT: 1.0
158
+ PIXEL_MEAN:
159
+ - 123.675
160
+ - 116.28
161
+ - 103.53
162
+ PIXEL_STD:
163
+ - 58.395
164
+ - 57.12
165
+ - 57.375
166
+ PROPOSAL_GENERATOR:
167
+ MIN_SIZE: 0
168
+ NAME: RPN
169
+ RESNETS:
170
+ DEFORM_MODULATED: false
171
+ DEFORM_NUM_GROUPS: 1
172
+ DEFORM_ON_PER_STAGE:
173
+ - false
174
+ - false
175
+ - false
176
+ - false
177
+ DEPTH: 50
178
+ NORM: FrozenBN
179
+ NUM_GROUPS: 1
180
+ OUT_FEATURES:
181
+ - res2
182
+ - res3
183
+ - res4
184
+ - res5
185
+ RES2_OUT_CHANNELS: 256
186
+ RES4_DILATION: 1
187
+ RES5_DILATION: 1
188
+ RES5_MULTI_GRID:
189
+ - 1
190
+ - 1
191
+ - 1
192
+ STEM_OUT_CHANNELS: 64
193
+ STEM_TYPE: basic
194
+ STRIDE_IN_1X1: false
195
+ WIDTH_PER_GROUP: 64
196
+ RETINANET:
197
+ BBOX_REG_LOSS_TYPE: smooth_l1
198
+ BBOX_REG_WEIGHTS: &id002
199
+ - 1.0
200
+ - 1.0
201
+ - 1.0
202
+ - 1.0
203
+ FOCAL_LOSS_ALPHA: 0.25
204
+ FOCAL_LOSS_GAMMA: 2.0
205
+ IN_FEATURES:
206
+ - p3
207
+ - p4
208
+ - p5
209
+ - p6
210
+ - p7
211
+ IOU_LABELS:
212
+ - 0
213
+ - -1
214
+ - 1
215
+ IOU_THRESHOLDS:
216
+ - 0.4
217
+ - 0.5
218
+ NMS_THRESH_TEST: 0.5
219
+ NORM: ''
220
+ NUM_CLASSES: 80
221
+ NUM_CONVS: 4
222
+ PRIOR_PROB: 0.01
223
+ SCORE_THRESH_TEST: 0.05
224
+ SMOOTH_L1_LOSS_BETA: 0.1
225
+ TOPK_CANDIDATES_TEST: 1000
226
+ ROI_BOX_CASCADE_HEAD:
227
+ BBOX_REG_WEIGHTS:
228
+ - &id001
229
+ - 10.0
230
+ - 10.0
231
+ - 5.0
232
+ - 5.0
233
+ - - 20.0
234
+ - 20.0
235
+ - 10.0
236
+ - 10.0
237
+ - - 30.0
238
+ - 30.0
239
+ - 15.0
240
+ - 15.0
241
+ IOUS:
242
+ - 0.5
243
+ - 0.6
244
+ - 0.7
245
+ ROI_BOX_HEAD:
246
+ BBOX_REG_LOSS_TYPE: smooth_l1
247
+ BBOX_REG_LOSS_WEIGHT: 1.0
248
+ BBOX_REG_WEIGHTS: *id001
249
+ CLS_AGNOSTIC_BBOX_REG: false
250
+ CONV_DIM: 256
251
+ FC_DIM: 1024
252
+ FED_LOSS_FREQ_WEIGHT_POWER: 0.5
253
+ FED_LOSS_NUM_CLASSES: 50
254
+ NAME: ''
255
+ NORM: ''
256
+ NUM_CONV: 0
257
+ NUM_FC: 0
258
+ POOLER_RESOLUTION: 14
259
+ POOLER_SAMPLING_RATIO: 0
260
+ POOLER_TYPE: ROIAlignV2
261
+ SMOOTH_L1_BETA: 0.0
262
+ TRAIN_ON_PRED_BOXES: false
263
+ USE_FED_LOSS: false
264
+ USE_SIGMOID_CE: false
265
+ ROI_HEADS:
266
+ BATCH_SIZE_PER_IMAGE: 512
267
+ IN_FEATURES:
268
+ - res4
269
+ IOU_LABELS:
270
+ - 0
271
+ - 1
272
+ IOU_THRESHOLDS:
273
+ - 0.5
274
+ NAME: Res5ROIHeads
275
+ NMS_THRESH_TEST: 0.5
276
+ NUM_CLASSES: 80
277
+ POSITIVE_FRACTION: 0.25
278
+ PROPOSAL_APPEND_GT: true
279
+ SCORE_THRESH_TEST: 0.05
280
+ ROI_KEYPOINT_HEAD:
281
+ CONV_DIMS:
282
+ - 512
283
+ - 512
284
+ - 512
285
+ - 512
286
+ - 512
287
+ - 512
288
+ - 512
289
+ - 512
290
+ LOSS_WEIGHT: 1.0
291
+ MIN_KEYPOINTS_PER_IMAGE: 1
292
+ NAME: KRCNNConvDeconvUpsampleHead
293
+ NORMALIZE_LOSS_BY_VISIBLE_KEYPOINTS: true
294
+ NUM_KEYPOINTS: 17
295
+ POOLER_RESOLUTION: 14
296
+ POOLER_SAMPLING_RATIO: 0
297
+ POOLER_TYPE: ROIAlignV2
298
+ ROI_MASK_HEAD:
299
+ CLS_AGNOSTIC_MASK: false
300
+ CONV_DIM: 256
301
+ NAME: MaskRCNNConvUpsampleHead
302
+ NORM: ''
303
+ NUM_CONV: 0
304
+ POOLER_RESOLUTION: 14
305
+ POOLER_SAMPLING_RATIO: 0
306
+ POOLER_TYPE: ROIAlignV2
307
+ RPN:
308
+ BATCH_SIZE_PER_IMAGE: 256
309
+ BBOX_REG_LOSS_TYPE: smooth_l1
310
+ BBOX_REG_LOSS_WEIGHT: 1.0
311
+ BBOX_REG_WEIGHTS: *id002
312
+ BOUNDARY_THRESH: -1
313
+ CONV_DIMS:
314
+ - -1
315
+ HEAD_NAME: StandardRPNHead
316
+ IN_FEATURES:
317
+ - res4
318
+ IOU_LABELS:
319
+ - 0
320
+ - -1
321
+ - 1
322
+ IOU_THRESHOLDS:
323
+ - 0.3
324
+ - 0.7
325
+ LOSS_WEIGHT: 1.0
326
+ NMS_THRESH: 0.7
327
+ POSITIVE_FRACTION: 0.5
328
+ POST_NMS_TOPK_TEST: 1000
329
+ POST_NMS_TOPK_TRAIN: 2000
330
+ PRE_NMS_TOPK_TEST: 6000
331
+ PRE_NMS_TOPK_TRAIN: 12000
332
+ SMOOTH_L1_BETA: 0.0
333
+ SEM_SEG_HEAD:
334
+ ASPP_CHANNELS: 256
335
+ ASPP_DILATIONS:
336
+ - 6
337
+ - 12
338
+ - 18
339
+ ASPP_DROPOUT: 0.1
340
+ COMMON_STRIDE: 4
341
+ CONVS_DIM: 256
342
+ DEFORMABLE_TRANSFORMER_ENCODER_IN_FEATURES:
343
+ - res3
344
+ - res4
345
+ - res5
346
+ DEFORMABLE_TRANSFORMER_ENCODER_N_HEADS: 8
347
+ DEFORMABLE_TRANSFORMER_ENCODER_N_POINTS: 4
348
+ IGNORE_VALUE: 255
349
+ IN_FEATURES:
350
+ - res2
351
+ - res3
352
+ - res4
353
+ - res5
354
+ LOSS_TYPE: hard_pixel_mining
355
+ LOSS_WEIGHT: 1.0
356
+ MASK_DIM: 256
357
+ NAME: MaskFormerHead
358
+ NORM: GN
359
+ NUM_CLASSES: 150
360
+ PIXEL_DECODER_NAME: MSDeformAttnPixelDecoder
361
+ PROJECT_CHANNELS:
362
+ - 48
363
+ PROJECT_FEATURES:
364
+ - res2
365
+ TRANSFORMER_ENC_LAYERS: 6
366
+ USE_DEPTHWISE_SEPARABLE_CONV: false
367
+ SWIN:
368
+ APE: false
369
+ ATTN_DROP_RATE: 0.0
370
+ DEPTHS:
371
+ - 2
372
+ - 2
373
+ - 6
374
+ - 2
375
+ DROP_PATH_RATE: 0.3
376
+ DROP_RATE: 0.0
377
+ EMBED_DIM: 96
378
+ MLP_RATIO: 4.0
379
+ NUM_HEADS:
380
+ - 3
381
+ - 6
382
+ - 12
383
+ - 24
384
+ OUT_FEATURES:
385
+ - res2
386
+ - res3
387
+ - res4
388
+ - res5
389
+ PATCH_NORM: true
390
+ PATCH_SIZE: 4
391
+ PRETRAIN_IMG_SIZE: 224
392
+ QKV_BIAS: true
393
+ QK_SCALE: null
394
+ USE_CHECKPOINT: false
395
+ WINDOW_SIZE: 7
396
+ WEIGHTS: weight/R-50.pkl
397
+ OUTPUT_DIR: ./output/ps/100-5_unordered/step1
398
+ SEED: -1
399
+ SOLVER:
400
+ AMP:
401
+ ENABLED: true
402
+ BACKBONE_MULTIPLIER: 0.1
403
+ BASE_LR: 0.0001
404
+ BASE_LR_END: 0.0
405
+ BIAS_LR_FACTOR: 1.0
406
+ CHECKPOINT_PERIOD: 10000
407
+ CLIP_GRADIENTS:
408
+ CLIP_TYPE: full_model
409
+ CLIP_VALUE: 0.01
410
+ ENABLED: true
411
+ NORM_TYPE: 2.0
412
+ GAMMA: 0.1
413
+ IMS_PER_BATCH: 8
414
+ LR_SCHEDULER_NAME: WarmupMultiStepLR
415
+ MAX_ITER: 160000
416
+ MOMENTUM: 0.9
417
+ NESTEROV: false
418
+ NUM_DECAYS: 3
419
+ OPTIMIZER: ADAMW
420
+ POLY_LR_CONSTANT_ENDING: 0.0
421
+ POLY_LR_POWER: 0.9
422
+ REFERENCE_WORLD_SIZE: 0
423
+ RESCALE_INTERVAL: false
424
+ STEPS:
425
+ - 135000
426
+ - 150000
427
+ WARMUP_FACTOR: 1.0
428
+ WARMUP_ITERS: 0
429
+ WARMUP_METHOD: linear
430
+ WEIGHT_DECAY: 0.05
431
+ WEIGHT_DECAY_BIAS: null
432
+ WEIGHT_DECAY_EMBED: 0.0
433
+ WEIGHT_DECAY_NORM: 0.0
434
+ TEST:
435
+ AUG:
436
+ ENABLED: false
437
+ FLIP: true
438
+ MAX_SIZE: 4480
439
+ MIN_SIZES:
440
+ - 320
441
+ - 480
442
+ - 640
443
+ - 800
444
+ - 960
445
+ - 1120
446
+ DETECTIONS_PER_IMAGE: 100
447
+ EVAL_PERIOD: 2501
448
+ EXPECTED_RESULTS: []
449
+ KEYPOINT_OKS_SIGMAS: []
450
+ PRECISE_BN:
451
+ ENABLED: false
452
+ NUM_ITER: 200
453
+ VERSION: 2
454
+ VIS_PERIOD: 0
ps_100base/step1/fake_query.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52eda6da3faadc3edf8f49262b72efe7687f1b7c27cff55eeea13b824ac4b34d
3
+ size 18331439
ps_100base/step1/last_checkpoint ADDED
@@ -0,0 +1 @@
 
 
1
+ model_final.pth
ps_100base/step1/metrics.json ADDED
The diff for this file is too large to render. See raw diff
 
ps_100base/step1/model_final.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:665de431c48a425616066c4f66f595ba28ca6c7b59e2707be57adee7ac13fec8
3
+ size 534485834
ss_100base/step1/config.yaml ADDED
@@ -0,0 +1,452 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ CONT:
2
+ ADD_POS: false
3
+ BASE_CLS: 100
4
+ COLLECT_QUERY_MODE: false
5
+ COMBINE_PSDLABEL: true
6
+ CUMULATIVE_PSDNUM: false
7
+ DISTRIBUTION_ALPHA: 0.5
8
+ FILTER_KD: false
9
+ FREEZE_LABEL: false
10
+ INC_CLS: 5
11
+ KD_DECODER: true
12
+ KD_TEMPERATURE: 1.0
13
+ KD_TEMPERATURE2: 2.0
14
+ KD_TYPE: kl
15
+ KL_ALL: false
16
+ KL_WEIGHT: 2.0
17
+ LIB_SIZE: 80
18
+ MED_TOKENS_WEIGHT: 5.0
19
+ MEMORY: false
20
+ OLD_WEIGHTS: null
21
+ PSD_LABEL_THRESHOLD: 0.0
22
+ PSD_OVERLAP_THRESHOLD: 0.8
23
+ SETTING: overlapped
24
+ TASK: 1
25
+ TOT_CLS: 150
26
+ VQ_NUMBER: 5
27
+ VQ_STORE: false
28
+ WEIGHTED_SAMPLE: true
29
+ WEIGHTS: null
30
+ CUDNN_BENCHMARK: false
31
+ DATALOADER:
32
+ ASPECT_RATIO_GROUPING: true
33
+ FILTER_EMPTY_ANNOTATIONS: true
34
+ NUM_WORKERS: 2
35
+ REPEAT_SQRT: true
36
+ REPEAT_THRESHOLD: 0.0
37
+ SAMPLER_TRAIN: TrainingSampler
38
+ DATASETS:
39
+ PRECOMPUTED_PROPOSAL_TOPK_TEST: 1000
40
+ PRECOMPUTED_PROPOSAL_TOPK_TRAIN: 2000
41
+ PROPOSAL_FILES_TEST: []
42
+ PROPOSAL_FILES_TRAIN: []
43
+ TEST:
44
+ - current_ade20k_sem_seg_val
45
+ TRAIN:
46
+ - current_ade20k_sem_seg_train
47
+ GLOBAL:
48
+ HACK: 1.0
49
+ INPUT:
50
+ COLOR_AUG_SSD: true
51
+ CROP:
52
+ ENABLED: true
53
+ SINGLE_CATEGORY_MAX_AREA: 1.0
54
+ SIZE:
55
+ - 512
56
+ - 512
57
+ TYPE: absolute
58
+ DATASET_MAPPER_NAME: continual_semantic
59
+ FORMAT: RGB
60
+ IMAGE_SIZE: 1024
61
+ MASK_FORMAT: polygon
62
+ MAX_SCALE: 2.0
63
+ MAX_SIZE_TEST: 2048
64
+ MAX_SIZE_TRAIN: 2048
65
+ MIN_SCALE: 0.1
66
+ MIN_SIZE_TEST: 512
67
+ MIN_SIZE_TRAIN:
68
+ - 256
69
+ - 307
70
+ - 358
71
+ - 409
72
+ - 460
73
+ - 512
74
+ - 563
75
+ - 614
76
+ - 665
77
+ - 716
78
+ - 768
79
+ - 819
80
+ - 870
81
+ - 921
82
+ - 972
83
+ - 1024
84
+ MIN_SIZE_TRAIN_SAMPLING: choice
85
+ RANDOM_FLIP: horizontal
86
+ SIZE_DIVISIBILITY: 512
87
+ MODEL:
88
+ ANCHOR_GENERATOR:
89
+ ANGLES:
90
+ - - -90
91
+ - 0
92
+ - 90
93
+ ASPECT_RATIOS:
94
+ - - 0.5
95
+ - 1.0
96
+ - 2.0
97
+ NAME: DefaultAnchorGenerator
98
+ OFFSET: 0.0
99
+ SIZES:
100
+ - - 32
101
+ - 64
102
+ - 128
103
+ - 256
104
+ - 512
105
+ BACKBONE:
106
+ FREEZE_AT: 0
107
+ NAME: build_resnet_backbone
108
+ DEVICE: cuda
109
+ FPN:
110
+ FUSE_TYPE: sum
111
+ IN_FEATURES: []
112
+ NORM: ''
113
+ OUT_CHANNELS: 256
114
+ KEYPOINT_ON: false
115
+ LOAD_PROPOSALS: false
116
+ MASK_FORMER:
117
+ CLASS_WEIGHT: 2.0
118
+ CLIP_DIM: 512
119
+ DEC_LAYERS: 10
120
+ DEEP_SUPERVISION: true
121
+ DICE_WEIGHT: 5.0
122
+ DIM_FEEDFORWARD: 2048
123
+ DROPOUT: 0.0
124
+ ENC_LAYERS: 0
125
+ ENFORCE_INPUT_PROJ: false
126
+ HIDDEN_DIM: 256
127
+ IMPORTANCE_SAMPLE_RATIO: 0.75
128
+ MASK_WEIGHT: 5.0
129
+ NHEADS: 8
130
+ NO_OBJECT_WEIGHT: 0.1
131
+ NUM_OBJECT_QUERIES: 100
132
+ OVERSAMPLE_RATIO: 3.0
133
+ PRE_NORM: false
134
+ SIZE_DIVISIBILITY: 32
135
+ TEST:
136
+ INSTANCE_ON: false
137
+ OBJECT_MASK_THRESHOLD: 0.8
138
+ OVERLAP_THRESHOLD: 0.8
139
+ PANOPTIC_ON: false
140
+ SEMANTIC_ON: true
141
+ SEM_SEG_POSTPROCESSING_BEFORE_INFERENCE: false
142
+ TEXT_PATH: ''
143
+ TRAIN_NUM_POINTS: 12544
144
+ TRANSFORMER_DECODER_NAME: MultiScaleMaskedTransformerDecoder
145
+ TRANSFORMER_IN_FEATURE: multi_scale_pixel_decoder
146
+ USE_TEXT_EMBEDDING: false
147
+ MASK_ON: false
148
+ META_ARCHITECTURE: MaskFormer
149
+ PANOPTIC_FPN:
150
+ COMBINE:
151
+ ENABLED: true
152
+ INSTANCES_CONFIDENCE_THRESH: 0.5
153
+ OVERLAP_THRESH: 0.5
154
+ STUFF_AREA_LIMIT: 4096
155
+ INSTANCE_LOSS_WEIGHT: 1.0
156
+ PIXEL_MEAN:
157
+ - 123.675
158
+ - 116.28
159
+ - 103.53
160
+ PIXEL_STD:
161
+ - 58.395
162
+ - 57.12
163
+ - 57.375
164
+ PROPOSAL_GENERATOR:
165
+ MIN_SIZE: 0
166
+ NAME: RPN
167
+ RESNETS:
168
+ DEFORM_MODULATED: false
169
+ DEFORM_NUM_GROUPS: 1
170
+ DEFORM_ON_PER_STAGE:
171
+ - false
172
+ - false
173
+ - false
174
+ - false
175
+ DEPTH: 101
176
+ NORM: FrozenBN
177
+ NUM_GROUPS: 1
178
+ OUT_FEATURES:
179
+ - res2
180
+ - res3
181
+ - res4
182
+ - res5
183
+ RES2_OUT_CHANNELS: 256
184
+ RES4_DILATION: 1
185
+ RES5_DILATION: 1
186
+ RES5_MULTI_GRID:
187
+ - 1
188
+ - 1
189
+ - 1
190
+ STEM_OUT_CHANNELS: 64
191
+ STEM_TYPE: basic
192
+ STRIDE_IN_1X1: false
193
+ WIDTH_PER_GROUP: 64
194
+ RETINANET:
195
+ BBOX_REG_LOSS_TYPE: smooth_l1
196
+ BBOX_REG_WEIGHTS: &id002
197
+ - 1.0
198
+ - 1.0
199
+ - 1.0
200
+ - 1.0
201
+ FOCAL_LOSS_ALPHA: 0.25
202
+ FOCAL_LOSS_GAMMA: 2.0
203
+ IN_FEATURES:
204
+ - p3
205
+ - p4
206
+ - p5
207
+ - p6
208
+ - p7
209
+ IOU_LABELS:
210
+ - 0
211
+ - -1
212
+ - 1
213
+ IOU_THRESHOLDS:
214
+ - 0.4
215
+ - 0.5
216
+ NMS_THRESH_TEST: 0.5
217
+ NORM: ''
218
+ NUM_CLASSES: 80
219
+ NUM_CONVS: 4
220
+ PRIOR_PROB: 0.01
221
+ SCORE_THRESH_TEST: 0.05
222
+ SMOOTH_L1_LOSS_BETA: 0.1
223
+ TOPK_CANDIDATES_TEST: 1000
224
+ ROI_BOX_CASCADE_HEAD:
225
+ BBOX_REG_WEIGHTS:
226
+ - &id001
227
+ - 10.0
228
+ - 10.0
229
+ - 5.0
230
+ - 5.0
231
+ - - 20.0
232
+ - 20.0
233
+ - 10.0
234
+ - 10.0
235
+ - - 30.0
236
+ - 30.0
237
+ - 15.0
238
+ - 15.0
239
+ IOUS:
240
+ - 0.5
241
+ - 0.6
242
+ - 0.7
243
+ ROI_BOX_HEAD:
244
+ BBOX_REG_LOSS_TYPE: smooth_l1
245
+ BBOX_REG_LOSS_WEIGHT: 1.0
246
+ BBOX_REG_WEIGHTS: *id001
247
+ CLS_AGNOSTIC_BBOX_REG: false
248
+ CONV_DIM: 256
249
+ FC_DIM: 1024
250
+ FED_LOSS_FREQ_WEIGHT_POWER: 0.5
251
+ FED_LOSS_NUM_CLASSES: 50
252
+ NAME: ''
253
+ NORM: ''
254
+ NUM_CONV: 0
255
+ NUM_FC: 0
256
+ POOLER_RESOLUTION: 14
257
+ POOLER_SAMPLING_RATIO: 0
258
+ POOLER_TYPE: ROIAlignV2
259
+ SMOOTH_L1_BETA: 0.0
260
+ TRAIN_ON_PRED_BOXES: false
261
+ USE_FED_LOSS: false
262
+ USE_SIGMOID_CE: false
263
+ ROI_HEADS:
264
+ BATCH_SIZE_PER_IMAGE: 512
265
+ IN_FEATURES:
266
+ - res4
267
+ IOU_LABELS:
268
+ - 0
269
+ - 1
270
+ IOU_THRESHOLDS:
271
+ - 0.5
272
+ NAME: Res5ROIHeads
273
+ NMS_THRESH_TEST: 0.5
274
+ NUM_CLASSES: 80
275
+ POSITIVE_FRACTION: 0.25
276
+ PROPOSAL_APPEND_GT: true
277
+ SCORE_THRESH_TEST: 0.05
278
+ ROI_KEYPOINT_HEAD:
279
+ CONV_DIMS:
280
+ - 512
281
+ - 512
282
+ - 512
283
+ - 512
284
+ - 512
285
+ - 512
286
+ - 512
287
+ - 512
288
+ LOSS_WEIGHT: 1.0
289
+ MIN_KEYPOINTS_PER_IMAGE: 1
290
+ NAME: KRCNNConvDeconvUpsampleHead
291
+ NORMALIZE_LOSS_BY_VISIBLE_KEYPOINTS: true
292
+ NUM_KEYPOINTS: 17
293
+ POOLER_RESOLUTION: 14
294
+ POOLER_SAMPLING_RATIO: 0
295
+ POOLER_TYPE: ROIAlignV2
296
+ ROI_MASK_HEAD:
297
+ CLS_AGNOSTIC_MASK: false
298
+ CONV_DIM: 256
299
+ NAME: MaskRCNNConvUpsampleHead
300
+ NORM: ''
301
+ NUM_CONV: 0
302
+ POOLER_RESOLUTION: 14
303
+ POOLER_SAMPLING_RATIO: 0
304
+ POOLER_TYPE: ROIAlignV2
305
+ RPN:
306
+ BATCH_SIZE_PER_IMAGE: 256
307
+ BBOX_REG_LOSS_TYPE: smooth_l1
308
+ BBOX_REG_LOSS_WEIGHT: 1.0
309
+ BBOX_REG_WEIGHTS: *id002
310
+ BOUNDARY_THRESH: -1
311
+ CONV_DIMS:
312
+ - -1
313
+ HEAD_NAME: StandardRPNHead
314
+ IN_FEATURES:
315
+ - res4
316
+ IOU_LABELS:
317
+ - 0
318
+ - -1
319
+ - 1
320
+ IOU_THRESHOLDS:
321
+ - 0.3
322
+ - 0.7
323
+ LOSS_WEIGHT: 1.0
324
+ NMS_THRESH: 0.7
325
+ POSITIVE_FRACTION: 0.5
326
+ POST_NMS_TOPK_TEST: 1000
327
+ POST_NMS_TOPK_TRAIN: 2000
328
+ PRE_NMS_TOPK_TEST: 6000
329
+ PRE_NMS_TOPK_TRAIN: 12000
330
+ SMOOTH_L1_BETA: 0.0
331
+ SEM_SEG_HEAD:
332
+ ASPP_CHANNELS: 256
333
+ ASPP_DILATIONS:
334
+ - 6
335
+ - 12
336
+ - 18
337
+ ASPP_DROPOUT: 0.1
338
+ COMMON_STRIDE: 4
339
+ CONVS_DIM: 256
340
+ DEFORMABLE_TRANSFORMER_ENCODER_IN_FEATURES:
341
+ - res3
342
+ - res4
343
+ - res5
344
+ DEFORMABLE_TRANSFORMER_ENCODER_N_HEADS: 8
345
+ DEFORMABLE_TRANSFORMER_ENCODER_N_POINTS: 4
346
+ IGNORE_VALUE: 255
347
+ IN_FEATURES:
348
+ - res2
349
+ - res3
350
+ - res4
351
+ - res5
352
+ LOSS_TYPE: hard_pixel_mining
353
+ LOSS_WEIGHT: 1.0
354
+ MASK_DIM: 256
355
+ NAME: MaskFormerHead
356
+ NORM: GN
357
+ NUM_CLASSES: 150
358
+ PIXEL_DECODER_NAME: MSDeformAttnPixelDecoder
359
+ PROJECT_CHANNELS:
360
+ - 48
361
+ PROJECT_FEATURES:
362
+ - res2
363
+ TRANSFORMER_ENC_LAYERS: 6
364
+ USE_DEPTHWISE_SEPARABLE_CONV: false
365
+ SWIN:
366
+ APE: false
367
+ ATTN_DROP_RATE: 0.0
368
+ DEPTHS:
369
+ - 2
370
+ - 2
371
+ - 6
372
+ - 2
373
+ DROP_PATH_RATE: 0.3
374
+ DROP_RATE: 0.0
375
+ EMBED_DIM: 96
376
+ MLP_RATIO: 4.0
377
+ NUM_HEADS:
378
+ - 3
379
+ - 6
380
+ - 12
381
+ - 24
382
+ OUT_FEATURES:
383
+ - res2
384
+ - res3
385
+ - res4
386
+ - res5
387
+ PATCH_NORM: true
388
+ PATCH_SIZE: 4
389
+ PRETRAIN_IMG_SIZE: 224
390
+ QKV_BIAS: true
391
+ QK_SCALE: null
392
+ USE_CHECKPOINT: false
393
+ WINDOW_SIZE: 7
394
+ WEIGHTS: weight/R-101.pkl
395
+ OUTPUT_DIR: /storage/data/zhuyuchen530/ss/100_base/step1
396
+ SEED: -1
397
+ SOLVER:
398
+ AMP:
399
+ ENABLED: true
400
+ BACKBONE_MULTIPLIER: 0.1
401
+ BASE_LR: 0.0001
402
+ BASE_LR_END: 0.0
403
+ BIAS_LR_FACTOR: 1.0
404
+ CHECKPOINT_PERIOD: 50000
405
+ CLIP_GRADIENTS:
406
+ CLIP_TYPE: full_model
407
+ CLIP_VALUE: 0.01
408
+ ENABLED: true
409
+ NORM_TYPE: 2.0
410
+ GAMMA: 0.1
411
+ IMS_PER_BATCH: 8
412
+ LR_SCHEDULER_NAME: WarmupMultiStepLR
413
+ MAX_ITER: 160000
414
+ MOMENTUM: 0.9
415
+ NESTEROV: false
416
+ NUM_DECAYS: 3
417
+ OPTIMIZER: ADAMW
418
+ POLY_LR_CONSTANT_ENDING: 0.0
419
+ POLY_LR_POWER: 0.9
420
+ REFERENCE_WORLD_SIZE: 0
421
+ RESCALE_INTERVAL: false
422
+ STEPS:
423
+ - 135000
424
+ - 150000
425
+ WARMUP_FACTOR: 1.0
426
+ WARMUP_ITERS: 0
427
+ WARMUP_METHOD: linear
428
+ WEIGHT_DECAY: 0.05
429
+ WEIGHT_DECAY_BIAS: null
430
+ WEIGHT_DECAY_EMBED: 0.0
431
+ WEIGHT_DECAY_NORM: 0.0
432
+ TEST:
433
+ AUG:
434
+ ENABLED: false
435
+ FLIP: true
436
+ MAX_SIZE: 3584
437
+ MIN_SIZES:
438
+ - 256
439
+ - 384
440
+ - 512
441
+ - 640
442
+ - 768
443
+ - 896
444
+ DETECTIONS_PER_IMAGE: 100
445
+ EVAL_PERIOD: 10000
446
+ EXPECTED_RESULTS: []
447
+ KEYPOINT_OKS_SIGMAS: []
448
+ PRECISE_BN:
449
+ ENABLED: false
450
+ NUM_ITER: 200
451
+ VERSION: 2
452
+ VIS_PERIOD: 0
ss_100base/step1/fake_query.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5a9bbe09ab438914642d3bb840f240de8648fac51620d0ba6fd600f7f4bf856
3
+ size 18682863
ss_100base/step1/last_checkpoint ADDED
@@ -0,0 +1 @@
 
 
1
+ model_final.pth
ss_100base/step1/metrics.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:423de8296f1c39950dd58c98f370aa5538f09b7cd125a6625d52ea0a49044402
3
+ size 15435801
ss_100base/step1/model_final.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdf8eb7ef35161c23ec28ff2abee1681c43b9224242abe18abe14b31cd1df7d8
3
+ size 762309797