Commit ·
506cc79
1
Parent(s): e9ad675
add dyhead configs & weights
Browse files
- dyhead/atss_r50_config.yaml +28 -0
- dyhead/atss_r50_model.bin +3 -0
- dyhead/atss_swin_tiny_config.yaml +34 -0
- dyhead/atss_swin_tiny_model.bin +3 -0
- dyhead/faster_rcnn_r50_config.yaml +45 -0
- dyhead/faster_rcnn_r50_model.bin +3 -0
- dyhead/retinanet_r50_config.yaml +28 -0
- dyhead/retinanet_r50_model.bin +3 -0
dyhead/atss_r50_config.yaml
ADDED
|
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
MODEL:
|
| 2 |
+
META_ARCHITECTURE: "ATSS"
|
| 3 |
+
WEIGHTS: "detectron2://ImageNetPretrained/MSRA/R-50.pkl"
|
| 4 |
+
BACKBONE:
|
| 5 |
+
NAME: "build_retinanet_resnet_fpn_dyhead_backbone"
|
| 6 |
+
RESNETS:
|
| 7 |
+
DEPTH: 50
|
| 8 |
+
OUT_FEATURES: ["res3", "res4", "res5"]
|
| 9 |
+
FPN:
|
| 10 |
+
IN_FEATURES: ["res3", "res4", "res5"]
|
| 11 |
+
DYHEAD:
|
| 12 |
+
NUM_CONVS: 6
|
| 13 |
+
CHANNELS: 256
|
| 14 |
+
ANCHOR_GENERATOR:
|
| 15 |
+
SIZES: !!python/object/apply:eval ["[[x*2,] for x in [32, 64, 128, 256, 512 ]]"]
|
| 16 |
+
ASPECT_RATIOS: [1.0,]
|
| 17 |
+
OFFSET: 0.5
|
| 18 |
+
ATSS:
|
| 19 |
+
NUM_CONVS: 0
|
| 20 |
+
DATASETS:
|
| 21 |
+
TRAIN: ("coco_2017_train",)
|
| 22 |
+
TEST: ("coco_2017_val",)
|
| 23 |
+
SOLVER:
|
| 24 |
+
IMS_PER_BATCH: 16
|
| 25 |
+
BASE_LR: 0.01
|
| 26 |
+
STEPS: (60000, 80000)
|
| 27 |
+
MAX_ITER: 90000
|
| 28 |
+
VERSION: 2
|
dyhead/atss_r50_model.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c2eee9e73748ee6152ba5edce00a8b0579b808ae340d3040f540bc8b7ca8ecf3
|
| 3 |
+
size 155972489
|
dyhead/atss_swin_tiny_config.yaml
ADDED
|
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
MODEL:
|
| 2 |
+
META_ARCHITECTURE: "ATSS"
|
| 3 |
+
WEIGHTS: "swin_tiny_patch4_window7_224_d2.pth"
|
| 4 |
+
PIXEL_MEAN: [123.675, 116.28, 103.53]
|
| 5 |
+
PIXEL_STD: [58.395, 57.12, 57.375]
|
| 6 |
+
BACKBONE:
|
| 7 |
+
NAME: "build_retinanet_swin_fpn_dyhead_backbone"
|
| 8 |
+
SWINT:
|
| 9 |
+
OUT_FEATURES: ["stage3", "stage4", "stage5"]
|
| 10 |
+
FPN:
|
| 11 |
+
IN_FEATURES: ["stage3", "stage4", "stage5"]
|
| 12 |
+
DYHEAD:
|
| 13 |
+
NUM_CONVS: 6
|
| 14 |
+
CHANNELS: 256
|
| 15 |
+
ANCHOR_GENERATOR:
|
| 16 |
+
SIZES: !!python/object/apply:eval ["[[x*2,] for x in [32, 64, 128, 256, 512 ]]"]
|
| 17 |
+
ASPECT_RATIOS: [1.0,]
|
| 18 |
+
OFFSET: 0.5
|
| 19 |
+
ATSS:
|
| 20 |
+
NUM_CONVS: 0
|
| 21 |
+
DATASETS:
|
| 22 |
+
TRAIN: ("coco_2017_train",)
|
| 23 |
+
TEST: ("coco_2017_val",)
|
| 24 |
+
SOLVER:
|
| 25 |
+
IMS_PER_BATCH: 32
|
| 26 |
+
BASE_LR: 0.0001
|
| 27 |
+
WEIGHT_DECAY: 0.05
|
| 28 |
+
STEPS: (60000, 80000)
|
| 29 |
+
MAX_ITER: 90000
|
| 30 |
+
OPTIMIZER: "ADAMW"
|
| 31 |
+
INPUT:
|
| 32 |
+
FORMAT: "RGB"
|
| 33 |
+
MIN_SIZE_TRAIN: (640, 672, 704, 736, 768, 800)
|
| 34 |
+
VERSION: 2
|
dyhead/atss_swin_tiny_model.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c398fa3a779b4825e7d043d6451eca237db25386be509165654f0819dee8a26
|
| 3 |
+
size 169728933
|
dyhead/faster_rcnn_r50_config.yaml
ADDED
|
@@ -0,0 +1,45 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
MODEL:
|
| 2 |
+
META_ARCHITECTURE: "GeneralizedRCNN"
|
| 3 |
+
WEIGHTS: "detectron2://ImageNetPretrained/MSRA/R-50.pkl"
|
| 4 |
+
BACKBONE:
|
| 5 |
+
NAME: "build_resnet_fpn_dyhead_backbone"
|
| 6 |
+
RESNETS:
|
| 7 |
+
DEPTH: 50
|
| 8 |
+
OUT_FEATURES: ["res2", "res3", "res4", "res5"]
|
| 9 |
+
FPN:
|
| 10 |
+
IN_FEATURES: ["res2", "res3", "res4", "res5"]
|
| 11 |
+
DYHEAD:
|
| 12 |
+
NUM_CONVS: 6
|
| 13 |
+
CHANNELS: 256
|
| 14 |
+
ANCHOR_GENERATOR:
|
| 15 |
+
SIZES: [[32], [64], [128], [256], [512]] # One size for each in feature map
|
| 16 |
+
ASPECT_RATIOS: [[0.5, 1.0, 2.0]] # Three aspect ratios (same for all in feature maps)
|
| 17 |
+
RPN:
|
| 18 |
+
IN_FEATURES: ["p2", "p3", "p4", "p5", "p6"]
|
| 19 |
+
PRE_NMS_TOPK_TRAIN: 2000 # Per FPN level
|
| 20 |
+
PRE_NMS_TOPK_TEST: 1000 # Per FPN level
|
| 21 |
+
# Detectron1 uses 2000 proposals per-batch,
|
| 22 |
+
# (See "modeling/rpn/rpn_outputs.py" for details of this legacy issue)
|
| 23 |
+
# which is approximately 1000 proposals per-image since the default batch size for FPN is 2.
|
| 24 |
+
POST_NMS_TOPK_TRAIN: 1000
|
| 25 |
+
POST_NMS_TOPK_TEST: 1000
|
| 26 |
+
ROI_HEADS:
|
| 27 |
+
NAME: "StandardROIHeads"
|
| 28 |
+
IN_FEATURES: ["p2", "p3", "p4", "p5"]
|
| 29 |
+
ROI_BOX_HEAD:
|
| 30 |
+
NAME: "FastRCNNConvFCHead"
|
| 31 |
+
NUM_FC: 2
|
| 32 |
+
POOLER_RESOLUTION: 7
|
| 33 |
+
ROI_MASK_HEAD:
|
| 34 |
+
NAME: "MaskRCNNConvUpsampleHead"
|
| 35 |
+
NUM_CONV: 4
|
| 36 |
+
POOLER_RESOLUTION: 14
|
| 37 |
+
DATASETS:
|
| 38 |
+
TRAIN: ("coco_2017_train",)
|
| 39 |
+
TEST: ("coco_2017_val",)
|
| 40 |
+
SOLVER:
|
| 41 |
+
IMS_PER_BATCH: 16
|
| 42 |
+
BASE_LR: 0.02
|
| 43 |
+
STEPS: (60000, 80000)
|
| 44 |
+
MAX_ITER: 90000
|
| 45 |
+
VERSION: 2
|
dyhead/faster_rcnn_r50_model.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:35d7229f84f96c81cddb8d0c7b9a706939b0dd987e7733f8cd0ee9c75c560c82
|
| 3 |
+
size 213392451
|
dyhead/retinanet_r50_config.yaml
ADDED
|
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
MODEL:
|
| 2 |
+
META_ARCHITECTURE: "RetinaNet"
|
| 3 |
+
WEIGHTS: "detectron2://ImageNetPretrained/MSRA/R-50.pkl"
|
| 4 |
+
BACKBONE:
|
| 5 |
+
NAME: "build_retinanet_resnet_fpn_dyhead_backbone"
|
| 6 |
+
RESNETS:
|
| 7 |
+
DEPTH: 50
|
| 8 |
+
OUT_FEATURES: ["res3", "res4", "res5"]
|
| 9 |
+
FPN:
|
| 10 |
+
IN_FEATURES: ["res3", "res4", "res5"]
|
| 11 |
+
DYHEAD:
|
| 12 |
+
NUM_CONVS: 6
|
| 13 |
+
CHANNELS: 256
|
| 14 |
+
ANCHOR_GENERATOR:
|
| 15 |
+
SIZES: !!python/object/apply:eval ["[[x, x * 2**(1.0/3), x * 2**(2.0/3) ] for x in [32, 64, 128, 256, 512 ]]"]
|
| 16 |
+
RETINANET:
|
| 17 |
+
IOU_THRESHOLDS: [0.4, 0.5]
|
| 18 |
+
IOU_LABELS: [0, -1, 1]
|
| 19 |
+
SMOOTH_L1_LOSS_BETA: 0.0
|
| 20 |
+
DATASETS:
|
| 21 |
+
TRAIN: ("coco_2017_train",)
|
| 22 |
+
TEST: ("coco_2017_val",)
|
| 23 |
+
SOLVER:
|
| 24 |
+
IMS_PER_BATCH: 16
|
| 25 |
+
BASE_LR: 0.01
|
| 26 |
+
STEPS: (60000, 80000)
|
| 27 |
+
MAX_ITER: 90000
|
| 28 |
+
VERSION: 2
|
dyhead/retinanet_r50_model.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:798b595d6e45f826474eb97b2fe56cebf46b33923c24b03d92553efb3399b694
|
| 3 |
+
size 181741239
|