# Source: SimCIS/ps_100base/step1/config.yaml
# Uploaded by: LightningNO1
# Commit message: Upload folder using huggingface_hub
# Commit: 4c86dc8 (verified)
# Project-specific CONT section. Nesting restored: every key from ADD_POS to
# WEIGHTS is a child of CONT (the flattened form left CONT empty and leaked
# these keys to the top level).
# NOTE(review): BASE_CLS / INC_CLS / TOT_CLS / TASK look like a class-incremental
# schedule (100 base classes, 5 new classes per step, 150 total, step 1) —
# confirm against the consuming code.
CONT:
  ADD_POS: false
  BASE_CLS: 100
  COLLECT_QUERY_MODE: false
  COMBINE_PSDLABEL: false
  CUMULATIVE_PSDNUM: false
  DISTRIBUTION_ALPHA: 0.5
  FILTER_KD: false
  FREEZE_LABEL: false
  INC_CLS: 5
  KD_DECODER: true
  KD_TEMPERATURE: 1.0
  KD_TEMPERATURE2: 1.0
  KD_TYPE: kl
  KL_ALL: true
  KL_WEIGHT: 2.0
  LIB_SIZE: 80
  MED_TOKENS_WEIGHT: 5.0
  MEMORY: false
  MPATH: memory/pan
  OLD_MODEL: true
  OLD_WEIGHTS: null
  PSD_LABEL_THRESHOLD: 0.35
  PSD_OVERLAP_THRESHOLD: 0.8
  SETTING: overlapped
  TASK: 1
  TOT_CLS: 150
  VQ_NUMBER: 3
  VQ_STORE: false
  WEIGHTED_SAMPLE: true
  # Distinct from MODEL.WEIGHTS; both are only unambiguous once nested.
  WEIGHTS: null
# Top-level scalar option.
# NOTE(review): presumably toggles cuDNN benchmark/autotune mode in the
# training framework — confirm against the framework's config defaults.
CUDNN_BENCHMARK: false
# Data-loading options. Nesting restored: all keys below are children of
# DATALOADER.
DATALOADER:
  ASPECT_RATIO_GROUPING: true
  FILTER_EMPTY_ANNOTATIONS: true
  NUM_WORKERS: 2
  REPEAT_SQRT: true
  REPEAT_THRESHOLD: 0.0
  SAMPLER_TRAIN: TrainingSampler
# Dataset selection. Nesting restored: TEST and TRAIN here are DATASETS.TEST /
# DATASETS.TRAIN (lists of dataset names), not the top-level TEST section.
DATASETS:
  PRECOMPUTED_PROPOSAL_TOPK_TEST: 1000
  PRECOMPUTED_PROPOSAL_TOPK_TRAIN: 2000
  PROPOSAL_FILES_TEST: []
  PROPOSAL_FILES_TRAIN: []
  TEST:
  - current_ade20k_panoptic_val
  TRAIN:
  - current_ade20k_panoptic_train
# Nesting restored: HACK is a child of GLOBAL.
GLOBAL:
  HACK: 1.0
# Input pipeline / augmentation options. Nesting restored: CROP is a sub-node
# with its own ENABLED / SINGLE_CATEGORY_MAX_AREA / SIZE / TYPE keys, and
# MIN_SIZE_TRAIN is a 16-entry list (320..1280 in steps of 64).
INPUT:
  COLOR_AUG_SSD: true
  CROP:
    ENABLED: true
    SINGLE_CATEGORY_MAX_AREA: 1.0
    SIZE:
    - 640
    - 640
    TYPE: absolute
  DATASET_MAPPER_NAME: continual_panoptic
  FORMAT: RGB
  IMAGE_SIZE: 1024
  MASK_FORMAT: polygon
  MAX_SCALE: 2.0
  MAX_SIZE_TEST: 2560
  MAX_SIZE_TRAIN: 2560
  MIN_SCALE: 0.1
  MIN_SIZE_TEST: 640
  MIN_SIZE_TRAIN:
  - 320
  - 384
  - 448
  - 512
  - 576
  - 640
  - 704
  - 768
  - 832
  - 896
  - 960
  - 1024
  - 1088
  - 1152
  - 1216
  - 1280
  MIN_SIZE_TRAIN_SAMPLING: choice
  RANDOM_FLIP: horizontal
  # INPUT-level divisibility (640); MODEL.MASK_FORMER has its own
  # SIZE_DIVISIBILITY (32).
  SIZE_DIVISIBILITY: 640
# Model definition. Nesting restored from the flattened dump: each sub-node
# (ANCHOR_GENERATOR, BACKBONE, FPN, MASK_FORMER, ...) owns the keys listed
# beneath it, so repeated names such as NAME, NORM, IN_FEATURES and NUM_CLASSES
# no longer collide.
# META_ARCHITECTURE is MaskFormer with a build_resnet_backbone backbone
# (RESNETS.DEPTH 50) and a MaskFormerHead segmentation head.
# NOTE(review): RETINANET / RPN / ROI_* / SWIN / PANOPTIC_FPN are presumably
# framework defaults not exercised by this architecture — confirm before
# pruning.
MODEL:
  ANCHOR_GENERATOR:
    # ANGLES, ASPECT_RATIOS and SIZES are each a list containing one inner list.
    ANGLES:
    - - -90
      - 0
      - 90
    ASPECT_RATIOS:
    - - 0.5
      - 1.0
      - 2.0
    NAME: DefaultAnchorGenerator
    OFFSET: 0.0
    SIZES:
    - - 32
      - 64
      - 128
      - 256
      - 512
  BACKBONE:
    FREEZE_AT: 0
    NAME: build_resnet_backbone
  DEVICE: cuda
  FPN:
    FUSE_TYPE: sum
    IN_FEATURES: []
    NORM: ''
    OUT_CHANNELS: 256
  KEYPOINT_ON: false
  LOAD_PROPOSALS: false
  MASK_FORMER:
    CLASS_WEIGHT: 4.0
    CLIP_DIM: 768
    DEC_LAYERS: 10
    DEEP_SUPERVISION: true
    DICE_WEIGHT: 5.0
    DIM_FEEDFORWARD: 2048
    DROPOUT: 0.0
    ENC_LAYERS: 0
    ENFORCE_INPUT_PROJ: false
    HIDDEN_DIM: 256
    IMPORTANCE_SAMPLE_RATIO: 0.75
    MASK_WEIGHT: 5.0
    NHEADS: 8
    NO_OBJECT_WEIGHT: 0.1
    NUM_OBJECT_QUERIES: 100
    OVERSAMPLE_RATIO: 3.0
    PRE_NORM: false
    SIZE_DIVISIBILITY: 32
    # MASK_FORMER.TEST: inference switches, separate from the top-level TEST.
    TEST:
      INSTANCE_ON: true
      OBJECT_MASK_THRESHOLD: 0.25
      OVERLAP_THRESHOLD: 0.8
      PANOPTIC_ON: true
      SEMANTIC_ON: true
      SEM_SEG_POSTPROCESSING_BEFORE_INFERENCE: false
    TEXT_PATH: label_embedding/ade20k_150_laion768_all.npy
    TRAIN_NUM_POINTS: 12544
    TRANSFORMER_DECODER_NAME: MultiScaleMaskedTransformerDecoder
    TRANSFORMER_IN_FEATURE: multi_scale_pixel_decoder
    USE_TEXT_EMBEDDING: false
  MASK_ON: false
  META_ARCHITECTURE: MaskFormer
  PANOPTIC_FPN:
    COMBINE:
      ENABLED: true
      INSTANCES_CONFIDENCE_THRESH: 0.5
      OVERLAP_THRESH: 0.5
      STUFF_AREA_LIMIT: 4096
    INSTANCE_LOSS_WEIGHT: 1.0
  PIXEL_MEAN:
  - 123.675
  - 116.28
  - 103.53
  PIXEL_STD:
  - 58.395
  - 57.12
  - 57.375
  PROPOSAL_GENERATOR:
    MIN_SIZE: 0
    NAME: RPN
  RESNETS:
    DEFORM_MODULATED: false
    DEFORM_NUM_GROUPS: 1
    DEFORM_ON_PER_STAGE:
    - false
    - false
    - false
    - false
    DEPTH: 50
    NORM: FrozenBN
    NUM_GROUPS: 1
    OUT_FEATURES:
    - res2
    - res3
    - res4
    - res5
    RES2_OUT_CHANNELS: 256
    RES4_DILATION: 1
    RES5_DILATION: 1
    RES5_MULTI_GRID:
    - 1
    - 1
    - 1
    STEM_OUT_CHANNELS: 64
    STEM_TYPE: basic
    STRIDE_IN_1X1: false
    WIDTH_PER_GROUP: 64
  RETINANET:
    BBOX_REG_LOSS_TYPE: smooth_l1
    # Anchor id002 is reused by RPN.BBOX_REG_WEIGHTS below.
    BBOX_REG_WEIGHTS: &id002
    - 1.0
    - 1.0
    - 1.0
    - 1.0
    FOCAL_LOSS_ALPHA: 0.25
    FOCAL_LOSS_GAMMA: 2.0
    IN_FEATURES:
    - p3
    - p4
    - p5
    - p6
    - p7
    IOU_LABELS:
    - 0
    - -1
    - 1
    IOU_THRESHOLDS:
    - 0.4
    - 0.5
    NMS_THRESH_TEST: 0.5
    NORM: ''
    NUM_CLASSES: 80
    NUM_CONVS: 4
    PRIOR_PROB: 0.01
    SCORE_THRESH_TEST: 0.05
    SMOOTH_L1_LOSS_BETA: 0.1
    TOPK_CANDIDATES_TEST: 1000
  ROI_BOX_CASCADE_HEAD:
    # Three 4-element weight lists; the first carries anchor id001, which
    # ROI_BOX_HEAD.BBOX_REG_WEIGHTS aliases.
    BBOX_REG_WEIGHTS:
    - &id001
      - 10.0
      - 10.0
      - 5.0
      - 5.0
    - - 20.0
      - 20.0
      - 10.0
      - 10.0
    - - 30.0
      - 30.0
      - 15.0
      - 15.0
    IOUS:
    - 0.5
    - 0.6
    - 0.7
  ROI_BOX_HEAD:
    BBOX_REG_LOSS_TYPE: smooth_l1
    BBOX_REG_LOSS_WEIGHT: 1.0
    BBOX_REG_WEIGHTS: *id001
    CLS_AGNOSTIC_BBOX_REG: false
    CONV_DIM: 256
    FC_DIM: 1024
    FED_LOSS_FREQ_WEIGHT_POWER: 0.5
    FED_LOSS_NUM_CLASSES: 50
    NAME: ''
    NORM: ''
    NUM_CONV: 0
    NUM_FC: 0
    POOLER_RESOLUTION: 14
    POOLER_SAMPLING_RATIO: 0
    POOLER_TYPE: ROIAlignV2
    SMOOTH_L1_BETA: 0.0
    TRAIN_ON_PRED_BOXES: false
    USE_FED_LOSS: false
    USE_SIGMOID_CE: false
  ROI_HEADS:
    BATCH_SIZE_PER_IMAGE: 512
    IN_FEATURES:
    - res4
    IOU_LABELS:
    - 0
    - 1
    IOU_THRESHOLDS:
    - 0.5
    NAME: Res5ROIHeads
    NMS_THRESH_TEST: 0.5
    NUM_CLASSES: 80
    POSITIVE_FRACTION: 0.25
    PROPOSAL_APPEND_GT: true
    SCORE_THRESH_TEST: 0.05
  ROI_KEYPOINT_HEAD:
    CONV_DIMS:
    - 512
    - 512
    - 512
    - 512
    - 512
    - 512
    - 512
    - 512
    LOSS_WEIGHT: 1.0
    MIN_KEYPOINTS_PER_IMAGE: 1
    NAME: KRCNNConvDeconvUpsampleHead
    NORMALIZE_LOSS_BY_VISIBLE_KEYPOINTS: true
    NUM_KEYPOINTS: 17
    POOLER_RESOLUTION: 14
    POOLER_SAMPLING_RATIO: 0
    POOLER_TYPE: ROIAlignV2
  ROI_MASK_HEAD:
    CLS_AGNOSTIC_MASK: false
    CONV_DIM: 256
    NAME: MaskRCNNConvUpsampleHead
    NORM: ''
    NUM_CONV: 0
    POOLER_RESOLUTION: 14
    POOLER_SAMPLING_RATIO: 0
    POOLER_TYPE: ROIAlignV2
  RPN:
    BATCH_SIZE_PER_IMAGE: 256
    BBOX_REG_LOSS_TYPE: smooth_l1
    BBOX_REG_LOSS_WEIGHT: 1.0
    BBOX_REG_WEIGHTS: *id002
    BOUNDARY_THRESH: -1
    CONV_DIMS:
    - -1
    HEAD_NAME: StandardRPNHead
    IN_FEATURES:
    - res4
    IOU_LABELS:
    - 0
    - -1
    - 1
    IOU_THRESHOLDS:
    - 0.3
    - 0.7
    LOSS_WEIGHT: 1.0
    NMS_THRESH: 0.7
    POSITIVE_FRACTION: 0.5
    POST_NMS_TOPK_TEST: 1000
    POST_NMS_TOPK_TRAIN: 2000
    PRE_NMS_TOPK_TEST: 6000
    PRE_NMS_TOPK_TRAIN: 12000
    SMOOTH_L1_BETA: 0.0
  SEM_SEG_HEAD:
    ASPP_CHANNELS: 256
    ASPP_DILATIONS:
    - 6
    - 12
    - 18
    ASPP_DROPOUT: 0.1
    COMMON_STRIDE: 4
    CONVS_DIM: 256
    DEFORMABLE_TRANSFORMER_ENCODER_IN_FEATURES:
    - res3
    - res4
    - res5
    DEFORMABLE_TRANSFORMER_ENCODER_N_HEADS: 8
    DEFORMABLE_TRANSFORMER_ENCODER_N_POINTS: 4
    IGNORE_VALUE: 255
    IN_FEATURES:
    - res2
    - res3
    - res4
    - res5
    LOSS_TYPE: hard_pixel_mining
    LOSS_WEIGHT: 1.0
    MASK_DIM: 256
    NAME: MaskFormerHead
    NORM: GN
    # Matches CONT.TOT_CLS (150).
    NUM_CLASSES: 150
    PIXEL_DECODER_NAME: MSDeformAttnPixelDecoder
    PROJECT_CHANNELS:
    - 48
    PROJECT_FEATURES:
    - res2
    TRANSFORMER_ENC_LAYERS: 6
    USE_DEPTHWISE_SEPARABLE_CONV: false
  SWIN:
    APE: false
    ATTN_DROP_RATE: 0.0
    DEPTHS:
    - 2
    - 2
    - 6
    - 2
    DROP_PATH_RATE: 0.3
    DROP_RATE: 0.0
    EMBED_DIM: 96
    MLP_RATIO: 4.0
    NUM_HEADS:
    - 3
    - 6
    - 12
    - 24
    OUT_FEATURES:
    - res2
    - res3
    - res4
    - res5
    PATCH_NORM: true
    PATCH_SIZE: 4
    PRETRAIN_IMG_SIZE: 224
    QKV_BIAS: true
    QK_SCALE: null
    USE_CHECKPOINT: false
    WINDOW_SIZE: 7
  # MODEL.WEIGHTS: relative path to the initial checkpoint file.
  WEIGHTS: weight/R-50.pkl
# Top-level run settings.
# NOTE(review): the OUTPUT_DIR path says "100-5_unordered" while CONT.SETTING
# is "overlapped" — confirm the directory name is intentional.
# NOTE(review): a negative SEED presumably means "do not fix the seed" —
# confirm against the training framework.
OUTPUT_DIR: ./output/ps/100-5_unordered/step1
SEED: -1
# Optimizer / schedule options. Nesting restored: AMP and CLIP_GRADIENTS are
# sub-nodes (each has its own ENABLED flag), and STEPS is a two-entry list.
# The schedule is WarmupMultiStepLR with GAMMA 0.1 at iterations 135000 and
# 150000 of MAX_ITER 160000; WARMUP_ITERS is 0.
SOLVER:
  AMP:
    ENABLED: true
  BACKBONE_MULTIPLIER: 0.1
  BASE_LR: 0.0001
  BASE_LR_END: 0.0
  BIAS_LR_FACTOR: 1.0
  CHECKPOINT_PERIOD: 10000
  CLIP_GRADIENTS:
    CLIP_TYPE: full_model
    CLIP_VALUE: 0.01
    ENABLED: true
    NORM_TYPE: 2.0
  GAMMA: 0.1
  IMS_PER_BATCH: 8
  LR_SCHEDULER_NAME: WarmupMultiStepLR
  MAX_ITER: 160000
  MOMENTUM: 0.9
  NESTEROV: false
  NUM_DECAYS: 3
  OPTIMIZER: ADAMW
  POLY_LR_CONSTANT_ENDING: 0.0
  POLY_LR_POWER: 0.9
  REFERENCE_WORLD_SIZE: 0
  RESCALE_INTERVAL: false
  STEPS:
  - 135000
  - 150000
  WARMUP_FACTOR: 1.0
  WARMUP_ITERS: 0
  WARMUP_METHOD: linear
  WEIGHT_DECAY: 0.05
  WEIGHT_DECAY_BIAS: null
  WEIGHT_DECAY_EMBED: 0.0
  WEIGHT_DECAY_NORM: 0.0
# Top-level evaluation options (distinct from DATASETS.TEST and
# MODEL.MASK_FORMER.TEST). Nesting restored: AUG and PRECISE_BN are sub-nodes,
# each with its own ENABLED flag.
# NOTE(review): EVAL_PERIOD is 2501 while SOLVER.CHECKPOINT_PERIOD is 10000 —
# confirm the off-by-one-looking value is intentional.
TEST:
  AUG:
    ENABLED: false
    FLIP: true
    MAX_SIZE: 4480
    MIN_SIZES:
    - 320
    - 480
    - 640
    - 800
    - 960
    - 1120
  DETECTIONS_PER_IMAGE: 100
  EVAL_PERIOD: 2501
  EXPECTED_RESULTS: []
  KEYPOINT_OKS_SIGMAS: []
  PRECISE_BN:
    ENABLED: false
    NUM_ITER: 200
# Top-level scalars.
# NOTE(review): VERSION is presumably the config-schema version and VIS_PERIOD
# a visualization interval (0 presumably disabling it) — confirm against the
# framework's config defaults.
VERSION: 2
VIS_PERIOD: 0