Bryceee committed on
Commit
e1e2617
·
verified ·
1 Parent(s): 8195a88

Upload maskdino_Swinl_bs16_50ep_4s_dowsample1_2048_panoramic_x-ray_Mandibular_Canal_Maxillary_Sinus.yaml

Browse files
maskdino_Swinl_bs16_50ep_4s_dowsample1_2048_panoramic_x-ray_Mandibular_Canal_Maxillary_Sinus.yaml ADDED
@@ -0,0 +1,84 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _BASE_: ../Base-COCO-InstanceSegmentation.yaml
2
+ DATASETS:
3
+ TRAIN: ("panoramic_x-ray_Mandibular_Canal_Maxillary_Sinus",)
4
+ TEST: ("panoramic_x-ray_Mandibular_Canal_Maxillary_Sinus",)
5
+ MODEL:
6
+ META_ARCHITECTURE: "MaskDINO"
7
+ BACKBONE:
8
+ NAME: "D2SwinTransformer"
9
+ SWIN:
10
+ EMBED_DIM: 192
11
+ DEPTHS: [ 2, 2, 18, 2 ]
12
+ NUM_HEADS: [ 6, 12, 24, 48 ]
13
+ WINDOW_SIZE: 12
14
+ APE: False
15
+ DROP_PATH_RATE: 0.3
16
+ PATCH_NORM: True
17
+ PRETRAIN_IMG_SIZE: 384
18
+ WEIGHTS: "swin_large_patch4_window12_384_22k.pkl"
19
+ PIXEL_MEAN: [ 123.675, 116.280, 103.530 ]
20
+ PIXEL_STD: [ 58.395, 57.120, 57.375 ]
21
+ # head
22
+ SEM_SEG_HEAD:
23
+ NAME: "MaskDINOHead"
24
+ IGNORE_VALUE: 255
25
+ NUM_CLASSES: 2
26
+ LOSS_WEIGHT: 1.0
27
+ CONVS_DIM: 256
28
+ MASK_DIM: 256
29
+ NORM: "GN"
30
+ # pixel decoder
31
+ PIXEL_DECODER_NAME: "MaskDINOEncoder"
32
+ DIM_FEEDFORWARD: 2048
33
+ NUM_FEATURE_LEVELS: 4
34
+ TOTAL_NUM_FEATURE_LEVELS: 5
35
+ IN_FEATURES: ["res2", "res3", "res4", "res5"]
36
+ DEFORMABLE_TRANSFORMER_ENCODER_IN_FEATURES: ["res2","res3", "res4", "res5"]
37
+ COMMON_STRIDE: 4
38
+ TRANSFORMER_ENC_LAYERS: 6
39
+ FEATURE_ORDER: "low2high"
40
+ MaskDINO:
41
+ TRANSFORMER_DECODER_NAME: "MaskDINODecoder"
42
+ DEEP_SUPERVISION: True
43
+ NO_OBJECT_WEIGHT: 0.1
44
+ CLASS_WEIGHT: 4.0
45
+ MASK_WEIGHT: 5.0
46
+ DICE_WEIGHT: 5.0
47
+ BOX_WEIGHT: 5.0
48
+ GIOU_WEIGHT: 2.0
49
+ HIDDEN_DIM: 256
50
+ NUM_OBJECT_QUERIES: 300
51
+ NHEADS: 8
52
+ DROPOUT: 0.0
53
+ DIM_FEEDFORWARD: 2048
54
+ ENC_LAYERS: 0
55
+ PRE_NORM: False
56
+ ENFORCE_INPUT_PROJ: False
57
+ SIZE_DIVISIBILITY: 32
58
+ DEC_LAYERS: 9 # 9+1: 9 decoder layers, plus one extra loss computed on the learnable queries
59
+ TRAIN_NUM_POINTS: 12544
60
+ OVERSAMPLE_RATIO: 3.0
61
+ IMPORTANCE_SAMPLE_RATIO: 0.75
62
+ EVAL_FLAG: 1
63
+ INITIAL_PRED: True
64
+ TWO_STAGE: True
65
+ DN: "seg"
66
+ DN_NUM: 100
67
+ INITIALIZE_BOX_TYPE: 'bitmask'
68
+ TEST:
69
+ SEMANTIC_ON: False
70
+ INSTANCE_ON: True
71
+ PANOPTIC_ON: False
72
+ OVERLAP_THRESHOLD: 0.8
73
+ OBJECT_MASK_THRESHOLD: 0.25
74
+
75
+ SOLVER:
76
+ IMS_PER_BATCH: 2
77
+ BASE_LR: 0.0001
78
+ STEPS: (9000, 9500)
79
+ MAX_ITER: 10000
80
+ AMP:
81
+ ENABLED: True
82
+ TEST:
83
+ EVAL_PERIOD: 5000
84
+ # EVAL_FLAG: 1