| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351 |
- AUG:
- DETR: true
- CACHE_DIR: /mnt/localdata/users/yupanhuang/cache/huggingface
- CUDNN_BENCHMARK: false
- DATALOADER:
- ASPECT_RATIO_GROUPING: true
- FILTER_EMPTY_ANNOTATIONS: false
- NUM_WORKERS: 4
- REPEAT_THRESHOLD: 0.0
- SAMPLER_TRAIN: TrainingSampler
- DATASETS:
- PRECOMPUTED_PROPOSAL_TOPK_TEST: 1000
- PRECOMPUTED_PROPOSAL_TOPK_TRAIN: 2000
- PROPOSAL_FILES_TEST: []
- PROPOSAL_FILES_TRAIN: []
- TEST:
- - scihub_train
- TRAIN:
- - scihub_train
- GLOBAL:
- HACK: 1.0
- ICDAR_DATA_DIR_TEST: ''
- ICDAR_DATA_DIR_TRAIN: ''
- INPUT:
- CROP:
- ENABLED: true
- SIZE:
- - 384
- - 600
- TYPE: absolute_range
- FORMAT: RGB
- MASK_FORMAT: polygon
- MAX_SIZE_TEST: 1333
- MAX_SIZE_TRAIN: 1333
- MIN_SIZE_TEST: 800
- MIN_SIZE_TRAIN:
- - 480
- - 512
- - 544
- - 576
- - 608
- - 640
- - 672
- - 704
- - 736
- - 768
- - 800
- MIN_SIZE_TRAIN_SAMPLING: choice
- RANDOM_FLIP: horizontal
- MODEL:
- ANCHOR_GENERATOR:
- ANGLES:
- - - -90
- - 0
- - 90
- ASPECT_RATIOS:
- - - 0.5
- - 1.0
- - 2.0
- NAME: DefaultAnchorGenerator
- OFFSET: 0.0
- SIZES:
- - - 32
- - - 64
- - - 128
- - - 256
- - - 512
- BACKBONE:
- FREEZE_AT: 2
- NAME: build_vit_fpn_backbone
- CONFIG_PATH: ''
- DEVICE: cuda
- FPN:
- FUSE_TYPE: sum
- IN_FEATURES:
- - layer3
- - layer5
- - layer7
- - layer11
- NORM: ''
- OUT_CHANNELS: 256
- IMAGE_ONLY: true
- KEYPOINT_ON: false
- LOAD_PROPOSALS: false
- MASK_ON: true
- META_ARCHITECTURE: VLGeneralizedRCNN
- PANOPTIC_FPN:
- COMBINE:
- ENABLED: true
- INSTANCES_CONFIDENCE_THRESH: 0.5
- OVERLAP_THRESH: 0.5
- STUFF_AREA_LIMIT: 4096
- INSTANCE_LOSS_WEIGHT: 1.0
- PIXEL_MEAN:
- - 127.5
- - 127.5
- - 127.5
- PIXEL_STD:
- - 127.5
- - 127.5
- - 127.5
- PROPOSAL_GENERATOR:
- MIN_SIZE: 0
- NAME: RPN
- RESNETS:
- DEFORM_MODULATED: false
- DEFORM_NUM_GROUPS: 1
- DEFORM_ON_PER_STAGE:
- - false
- - false
- - false
- - false
- DEPTH: 50
- NORM: FrozenBN
- NUM_GROUPS: 1
- OUT_FEATURES:
- - res4
- RES2_OUT_CHANNELS: 256
- RES5_DILATION: 1
- STEM_OUT_CHANNELS: 64
- STRIDE_IN_1X1: true
- WIDTH_PER_GROUP: 64
- RETINANET:
- BBOX_REG_LOSS_TYPE: smooth_l1
- BBOX_REG_WEIGHTS:
- - 1.0
- - 1.0
- - 1.0
- - 1.0
- FOCAL_LOSS_ALPHA: 0.25
- FOCAL_LOSS_GAMMA: 2.0
- IN_FEATURES:
- - p3
- - p4
- - p5
- - p6
- - p7
- IOU_LABELS:
- - 0
- - -1
- - 1
- IOU_THRESHOLDS:
- - 0.4
- - 0.5
- NMS_THRESH_TEST: 0.5
- NORM: ''
- NUM_CLASSES: 10
- NUM_CONVS: 4
- PRIOR_PROB: 0.01
- SCORE_THRESH_TEST: 0.05
- SMOOTH_L1_LOSS_BETA: 0.1
- TOPK_CANDIDATES_TEST: 1000
- ROI_BOX_CASCADE_HEAD:
- BBOX_REG_WEIGHTS:
- - - 10.0
- - 10.0
- - 5.0
- - 5.0
- - - 20.0
- - 20.0
- - 10.0
- - 10.0
- - - 30.0
- - 30.0
- - 15.0
- - 15.0
- IOUS:
- - 0.5
- - 0.6
- - 0.7
- ROI_BOX_HEAD:
- BBOX_REG_LOSS_TYPE: smooth_l1
- BBOX_REG_LOSS_WEIGHT: 1.0
- BBOX_REG_WEIGHTS:
- - 10.0
- - 10.0
- - 5.0
- - 5.0
- CLS_AGNOSTIC_BBOX_REG: true
- CONV_DIM: 256
- FC_DIM: 1024
- NAME: FastRCNNConvFCHead
- NORM: ''
- NUM_CONV: 0
- NUM_FC: 2
- POOLER_RESOLUTION: 7
- POOLER_SAMPLING_RATIO: 0
- POOLER_TYPE: ROIAlignV2
- SMOOTH_L1_BETA: 0.0
- TRAIN_ON_PRED_BOXES: false
- ROI_HEADS:
- BATCH_SIZE_PER_IMAGE: 512
- IN_FEATURES:
- - p2
- - p3
- - p4
- - p5
- IOU_LABELS:
- - 0
- - 1
- IOU_THRESHOLDS:
- - 0.5
- NAME: CascadeROIHeads
- NMS_THRESH_TEST: 0.5
- NUM_CLASSES: 10
- POSITIVE_FRACTION: 0.25
- PROPOSAL_APPEND_GT: true
- SCORE_THRESH_TEST: 0.05
- ROI_KEYPOINT_HEAD:
- CONV_DIMS:
- - 512
- - 512
- - 512
- - 512
- - 512
- - 512
- - 512
- - 512
- LOSS_WEIGHT: 1.0
- MIN_KEYPOINTS_PER_IMAGE: 1
- NAME: KRCNNConvDeconvUpsampleHead
- NORMALIZE_LOSS_BY_VISIBLE_KEYPOINTS: true
- NUM_KEYPOINTS: 17
- POOLER_RESOLUTION: 14
- POOLER_SAMPLING_RATIO: 0
- POOLER_TYPE: ROIAlignV2
- ROI_MASK_HEAD:
- CLS_AGNOSTIC_MASK: false
- CONV_DIM: 256
- NAME: MaskRCNNConvUpsampleHead
- NORM: ''
- NUM_CONV: 4
- POOLER_RESOLUTION: 14
- POOLER_SAMPLING_RATIO: 0
- POOLER_TYPE: ROIAlignV2
- RPN:
- BATCH_SIZE_PER_IMAGE: 256
- BBOX_REG_LOSS_TYPE: smooth_l1
- BBOX_REG_LOSS_WEIGHT: 1.0
- BBOX_REG_WEIGHTS:
- - 1.0
- - 1.0
- - 1.0
- - 1.0
- BOUNDARY_THRESH: -1
- CONV_DIMS:
- - -1
- HEAD_NAME: StandardRPNHead
- IN_FEATURES:
- - p2
- - p3
- - p4
- - p5
- - p6
- IOU_LABELS:
- - 0
- - -1
- - 1
- IOU_THRESHOLDS:
- - 0.3
- - 0.7
- LOSS_WEIGHT: 1.0
- NMS_THRESH: 0.7
- POSITIVE_FRACTION: 0.5
- POST_NMS_TOPK_TEST: 1000
- POST_NMS_TOPK_TRAIN: 2000
- PRE_NMS_TOPK_TEST: 1000
- PRE_NMS_TOPK_TRAIN: 2000
- SMOOTH_L1_BETA: 0.0
- SEM_SEG_HEAD:
- COMMON_STRIDE: 4
- CONVS_DIM: 128
- IGNORE_VALUE: 255
- IN_FEATURES:
- - p2
- - p3
- - p4
- - p5
- LOSS_WEIGHT: 1.0
- NAME: SemSegFPNHead
- NORM: GN
- NUM_CLASSES: 10
- VIT:
- DROP_PATH: 0.1
- IMG_SIZE:
- - 224
- - 224
- NAME: layoutlmv3_base
- OUT_FEATURES:
- - layer3
- - layer5
- - layer7
- - layer11
- POS_TYPE: abs
- WEIGHTS:
- OUTPUT_DIR:
- SCIHUB_DATA_DIR_TRAIN: /mnt/petrelfs/share_data/zhaozhiyuan/publaynet/layout_scihub/train
- SEED: 42
- SOLVER:
- AMP:
- ENABLED: true
- BACKBONE_MULTIPLIER: 1.0
- BASE_LR: 0.0002
- BIAS_LR_FACTOR: 1.0
- CHECKPOINT_PERIOD: 2000
- CLIP_GRADIENTS:
- CLIP_TYPE: full_model
- CLIP_VALUE: 1.0
- ENABLED: true
- NORM_TYPE: 2.0
- GAMMA: 0.1
- GRADIENT_ACCUMULATION_STEPS: 1
- IMS_PER_BATCH: 32
- LR_SCHEDULER_NAME: WarmupCosineLR
- MAX_ITER: 20000
- MOMENTUM: 0.9
- NESTEROV: false
- OPTIMIZER: ADAMW
- REFERENCE_WORLD_SIZE: 0
- STEPS:
- - 10000
- WARMUP_FACTOR: 0.01
- WARMUP_ITERS: 333
- WARMUP_METHOD: linear
- WEIGHT_DECAY: 0.05
- WEIGHT_DECAY_BIAS: null
- WEIGHT_DECAY_NORM: 0.0
- TEST:
- AUG:
- ENABLED: false
- FLIP: true
- MAX_SIZE: 4000
- MIN_SIZES:
- - 400
- - 500
- - 600
- - 700
- - 800
- - 900
- - 1000
- - 1100
- - 1200
- DETECTIONS_PER_IMAGE: 100
- EVAL_PERIOD: 1000
- EXPECTED_RESULTS: []
- KEYPOINT_OKS_SIGMAS: []
- PRECISE_BN:
- ENABLED: false
- NUM_ITER: 200
- VERSION: 2
- VIS_PERIOD: 0
|