|
|
@@ -1,351 +0,0 @@
|
|
|
-AUG:
|
|
|
- DETR: true
|
|
|
-CACHE_DIR: ~/cache/huggingface
|
|
|
-CUDNN_BENCHMARK: false
|
|
|
-DATALOADER:
|
|
|
- ASPECT_RATIO_GROUPING: true
|
|
|
- FILTER_EMPTY_ANNOTATIONS: false
|
|
|
- NUM_WORKERS: 4
|
|
|
- REPEAT_THRESHOLD: 0.0
|
|
|
- SAMPLER_TRAIN: TrainingSampler
|
|
|
-DATASETS:
|
|
|
- PRECOMPUTED_PROPOSAL_TOPK_TEST: 1000
|
|
|
- PRECOMPUTED_PROPOSAL_TOPK_TRAIN: 2000
|
|
|
- PROPOSAL_FILES_TEST: []
|
|
|
- PROPOSAL_FILES_TRAIN: []
|
|
|
- TEST:
|
|
|
- - scihub_train
|
|
|
- TRAIN:
|
|
|
- - scihub_train
|
|
|
-GLOBAL:
|
|
|
- HACK: 1.0
|
|
|
-ICDAR_DATA_DIR_TEST: ''
|
|
|
-ICDAR_DATA_DIR_TRAIN: ''
|
|
|
-INPUT:
|
|
|
- CROP:
|
|
|
- ENABLED: true
|
|
|
- SIZE:
|
|
|
- - 384
|
|
|
- - 600
|
|
|
- TYPE: absolute_range
|
|
|
- FORMAT: RGB
|
|
|
- MASK_FORMAT: polygon
|
|
|
- MAX_SIZE_TEST: 1333
|
|
|
- MAX_SIZE_TRAIN: 1333
|
|
|
- MIN_SIZE_TEST: 800
|
|
|
- MIN_SIZE_TRAIN:
|
|
|
- - 480
|
|
|
- - 512
|
|
|
- - 544
|
|
|
- - 576
|
|
|
- - 608
|
|
|
- - 640
|
|
|
- - 672
|
|
|
- - 704
|
|
|
- - 736
|
|
|
- - 768
|
|
|
- - 800
|
|
|
- MIN_SIZE_TRAIN_SAMPLING: choice
|
|
|
- RANDOM_FLIP: horizontal
|
|
|
-MODEL:
|
|
|
- ANCHOR_GENERATOR:
|
|
|
- ANGLES:
|
|
|
- - - -90
|
|
|
- - 0
|
|
|
- - 90
|
|
|
- ASPECT_RATIOS:
|
|
|
- - - 0.5
|
|
|
- - 1.0
|
|
|
- - 2.0
|
|
|
- NAME: DefaultAnchorGenerator
|
|
|
- OFFSET: 0.0
|
|
|
- SIZES:
|
|
|
- - - 32
|
|
|
- - - 64
|
|
|
- - - 128
|
|
|
- - - 256
|
|
|
- - - 512
|
|
|
- BACKBONE:
|
|
|
- FREEZE_AT: 2
|
|
|
- NAME: build_vit_fpn_backbone
|
|
|
- CONFIG_PATH: ''
|
|
|
- DEVICE: cuda
|
|
|
- FPN:
|
|
|
- FUSE_TYPE: sum
|
|
|
- IN_FEATURES:
|
|
|
- - layer3
|
|
|
- - layer5
|
|
|
- - layer7
|
|
|
- - layer11
|
|
|
- NORM: ''
|
|
|
- OUT_CHANNELS: 256
|
|
|
- IMAGE_ONLY: true
|
|
|
- KEYPOINT_ON: false
|
|
|
- LOAD_PROPOSALS: false
|
|
|
- MASK_ON: true
|
|
|
- META_ARCHITECTURE: VLGeneralizedRCNN
|
|
|
- PANOPTIC_FPN:
|
|
|
- COMBINE:
|
|
|
- ENABLED: true
|
|
|
- INSTANCES_CONFIDENCE_THRESH: 0.5
|
|
|
- OVERLAP_THRESH: 0.5
|
|
|
- STUFF_AREA_LIMIT: 4096
|
|
|
- INSTANCE_LOSS_WEIGHT: 1.0
|
|
|
- PIXEL_MEAN:
|
|
|
- - 127.5
|
|
|
- - 127.5
|
|
|
- - 127.5
|
|
|
- PIXEL_STD:
|
|
|
- - 127.5
|
|
|
- - 127.5
|
|
|
- - 127.5
|
|
|
- PROPOSAL_GENERATOR:
|
|
|
- MIN_SIZE: 0
|
|
|
- NAME: RPN
|
|
|
- RESNETS:
|
|
|
- DEFORM_MODULATED: false
|
|
|
- DEFORM_NUM_GROUPS: 1
|
|
|
- DEFORM_ON_PER_STAGE:
|
|
|
- - false
|
|
|
- - false
|
|
|
- - false
|
|
|
- - false
|
|
|
- DEPTH: 50
|
|
|
- NORM: FrozenBN
|
|
|
- NUM_GROUPS: 1
|
|
|
- OUT_FEATURES:
|
|
|
- - res4
|
|
|
- RES2_OUT_CHANNELS: 256
|
|
|
- RES5_DILATION: 1
|
|
|
- STEM_OUT_CHANNELS: 64
|
|
|
- STRIDE_IN_1X1: true
|
|
|
- WIDTH_PER_GROUP: 64
|
|
|
- RETINANET:
|
|
|
- BBOX_REG_LOSS_TYPE: smooth_l1
|
|
|
- BBOX_REG_WEIGHTS:
|
|
|
- - 1.0
|
|
|
- - 1.0
|
|
|
- - 1.0
|
|
|
- - 1.0
|
|
|
- FOCAL_LOSS_ALPHA: 0.25
|
|
|
- FOCAL_LOSS_GAMMA: 2.0
|
|
|
- IN_FEATURES:
|
|
|
- - p3
|
|
|
- - p4
|
|
|
- - p5
|
|
|
- - p6
|
|
|
- - p7
|
|
|
- IOU_LABELS:
|
|
|
- - 0
|
|
|
- - -1
|
|
|
- - 1
|
|
|
- IOU_THRESHOLDS:
|
|
|
- - 0.4
|
|
|
- - 0.5
|
|
|
- NMS_THRESH_TEST: 0.5
|
|
|
- NORM: ''
|
|
|
- NUM_CLASSES: 10
|
|
|
- NUM_CONVS: 4
|
|
|
- PRIOR_PROB: 0.01
|
|
|
- SCORE_THRESH_TEST: 0.05
|
|
|
- SMOOTH_L1_LOSS_BETA: 0.1
|
|
|
- TOPK_CANDIDATES_TEST: 1000
|
|
|
- ROI_BOX_CASCADE_HEAD:
|
|
|
- BBOX_REG_WEIGHTS:
|
|
|
- - - 10.0
|
|
|
- - 10.0
|
|
|
- - 5.0
|
|
|
- - 5.0
|
|
|
- - - 20.0
|
|
|
- - 20.0
|
|
|
- - 10.0
|
|
|
- - 10.0
|
|
|
- - - 30.0
|
|
|
- - 30.0
|
|
|
- - 15.0
|
|
|
- - 15.0
|
|
|
- IOUS:
|
|
|
- - 0.5
|
|
|
- - 0.6
|
|
|
- - 0.7
|
|
|
- ROI_BOX_HEAD:
|
|
|
- BBOX_REG_LOSS_TYPE: smooth_l1
|
|
|
- BBOX_REG_LOSS_WEIGHT: 1.0
|
|
|
- BBOX_REG_WEIGHTS:
|
|
|
- - 10.0
|
|
|
- - 10.0
|
|
|
- - 5.0
|
|
|
- - 5.0
|
|
|
- CLS_AGNOSTIC_BBOX_REG: true
|
|
|
- CONV_DIM: 256
|
|
|
- FC_DIM: 1024
|
|
|
- NAME: FastRCNNConvFCHead
|
|
|
- NORM: ''
|
|
|
- NUM_CONV: 0
|
|
|
- NUM_FC: 2
|
|
|
- POOLER_RESOLUTION: 7
|
|
|
- POOLER_SAMPLING_RATIO: 0
|
|
|
- POOLER_TYPE: ROIAlignV2
|
|
|
- SMOOTH_L1_BETA: 0.0
|
|
|
- TRAIN_ON_PRED_BOXES: false
|
|
|
- ROI_HEADS:
|
|
|
- BATCH_SIZE_PER_IMAGE: 512
|
|
|
- IN_FEATURES:
|
|
|
- - p2
|
|
|
- - p3
|
|
|
- - p4
|
|
|
- - p5
|
|
|
- IOU_LABELS:
|
|
|
- - 0
|
|
|
- - 1
|
|
|
- IOU_THRESHOLDS:
|
|
|
- - 0.5
|
|
|
- NAME: CascadeROIHeads
|
|
|
- NMS_THRESH_TEST: 0.5
|
|
|
- NUM_CLASSES: 10
|
|
|
- POSITIVE_FRACTION: 0.25
|
|
|
- PROPOSAL_APPEND_GT: true
|
|
|
- SCORE_THRESH_TEST: 0.05
|
|
|
- ROI_KEYPOINT_HEAD:
|
|
|
- CONV_DIMS:
|
|
|
- - 512
|
|
|
- - 512
|
|
|
- - 512
|
|
|
- - 512
|
|
|
- - 512
|
|
|
- - 512
|
|
|
- - 512
|
|
|
- - 512
|
|
|
- LOSS_WEIGHT: 1.0
|
|
|
- MIN_KEYPOINTS_PER_IMAGE: 1
|
|
|
- NAME: KRCNNConvDeconvUpsampleHead
|
|
|
- NORMALIZE_LOSS_BY_VISIBLE_KEYPOINTS: true
|
|
|
- NUM_KEYPOINTS: 17
|
|
|
- POOLER_RESOLUTION: 14
|
|
|
- POOLER_SAMPLING_RATIO: 0
|
|
|
- POOLER_TYPE: ROIAlignV2
|
|
|
- ROI_MASK_HEAD:
|
|
|
- CLS_AGNOSTIC_MASK: false
|
|
|
- CONV_DIM: 256
|
|
|
- NAME: MaskRCNNConvUpsampleHead
|
|
|
- NORM: ''
|
|
|
- NUM_CONV: 4
|
|
|
- POOLER_RESOLUTION: 14
|
|
|
- POOLER_SAMPLING_RATIO: 0
|
|
|
- POOLER_TYPE: ROIAlignV2
|
|
|
- RPN:
|
|
|
- BATCH_SIZE_PER_IMAGE: 256
|
|
|
- BBOX_REG_LOSS_TYPE: smooth_l1
|
|
|
- BBOX_REG_LOSS_WEIGHT: 1.0
|
|
|
- BBOX_REG_WEIGHTS:
|
|
|
- - 1.0
|
|
|
- - 1.0
|
|
|
- - 1.0
|
|
|
- - 1.0
|
|
|
- BOUNDARY_THRESH: -1
|
|
|
- CONV_DIMS:
|
|
|
- - -1
|
|
|
- HEAD_NAME: StandardRPNHead
|
|
|
- IN_FEATURES:
|
|
|
- - p2
|
|
|
- - p3
|
|
|
- - p4
|
|
|
- - p5
|
|
|
- - p6
|
|
|
- IOU_LABELS:
|
|
|
- - 0
|
|
|
- - -1
|
|
|
- - 1
|
|
|
- IOU_THRESHOLDS:
|
|
|
- - 0.3
|
|
|
- - 0.7
|
|
|
- LOSS_WEIGHT: 1.0
|
|
|
- NMS_THRESH: 0.7
|
|
|
- POSITIVE_FRACTION: 0.5
|
|
|
- POST_NMS_TOPK_TEST: 1000
|
|
|
- POST_NMS_TOPK_TRAIN: 2000
|
|
|
- PRE_NMS_TOPK_TEST: 1000
|
|
|
- PRE_NMS_TOPK_TRAIN: 2000
|
|
|
- SMOOTH_L1_BETA: 0.0
|
|
|
- SEM_SEG_HEAD:
|
|
|
- COMMON_STRIDE: 4
|
|
|
- CONVS_DIM: 128
|
|
|
- IGNORE_VALUE: 255
|
|
|
- IN_FEATURES:
|
|
|
- - p2
|
|
|
- - p3
|
|
|
- - p4
|
|
|
- - p5
|
|
|
- LOSS_WEIGHT: 1.0
|
|
|
- NAME: SemSegFPNHead
|
|
|
- NORM: GN
|
|
|
- NUM_CLASSES: 10
|
|
|
- VIT:
|
|
|
- DROP_PATH: 0.1
|
|
|
- IMG_SIZE:
|
|
|
- - 224
|
|
|
- - 224
|
|
|
- NAME: layoutlmv3_base
|
|
|
- OUT_FEATURES:
|
|
|
- - layer3
|
|
|
- - layer5
|
|
|
- - layer7
|
|
|
- - layer11
|
|
|
- POS_TYPE: abs
|
|
|
- WEIGHTS:
|
|
|
-OUTPUT_DIR:
|
|
|
-SCIHUB_DATA_DIR_TRAIN: ~/publaynet/layout_scihub/train
|
|
|
-SEED: 42
|
|
|
-SOLVER:
|
|
|
- AMP:
|
|
|
- ENABLED: true
|
|
|
- BACKBONE_MULTIPLIER: 1.0
|
|
|
- BASE_LR: 0.0002
|
|
|
- BIAS_LR_FACTOR: 1.0
|
|
|
- CHECKPOINT_PERIOD: 2000
|
|
|
- CLIP_GRADIENTS:
|
|
|
- CLIP_TYPE: full_model
|
|
|
- CLIP_VALUE: 1.0
|
|
|
- ENABLED: true
|
|
|
- NORM_TYPE: 2.0
|
|
|
- GAMMA: 0.1
|
|
|
- GRADIENT_ACCUMULATION_STEPS: 1
|
|
|
- IMS_PER_BATCH: 32
|
|
|
- LR_SCHEDULER_NAME: WarmupCosineLR
|
|
|
- MAX_ITER: 20000
|
|
|
- MOMENTUM: 0.9
|
|
|
- NESTEROV: false
|
|
|
- OPTIMIZER: ADAMW
|
|
|
- REFERENCE_WORLD_SIZE: 0
|
|
|
- STEPS:
|
|
|
- - 10000
|
|
|
- WARMUP_FACTOR: 0.01
|
|
|
- WARMUP_ITERS: 333
|
|
|
- WARMUP_METHOD: linear
|
|
|
- WEIGHT_DECAY: 0.05
|
|
|
- WEIGHT_DECAY_BIAS: null
|
|
|
- WEIGHT_DECAY_NORM: 0.0
|
|
|
-TEST:
|
|
|
- AUG:
|
|
|
- ENABLED: false
|
|
|
- FLIP: true
|
|
|
- MAX_SIZE: 4000
|
|
|
- MIN_SIZES:
|
|
|
- - 400
|
|
|
- - 500
|
|
|
- - 600
|
|
|
- - 700
|
|
|
- - 800
|
|
|
- - 900
|
|
|
- - 1000
|
|
|
- - 1100
|
|
|
- - 1200
|
|
|
- DETECTIONS_PER_IMAGE: 100
|
|
|
- EVAL_PERIOD: 1000
|
|
|
- EXPECTED_RESULTS: []
|
|
|
- KEYPOINT_OKS_SIGMAS: []
|
|
|
- PRECISE_BN:
|
|
|
- ENABLED: false
|
|
|
- NUM_ITER: 200
|
|
|
-VERSION: 2
|
|
|
-VIS_PERIOD: 0
|