Skip to content

Commit 9e803ad

Browse files
committed
depth model
2 parents 681ab4c + e60cc45 commit 9e803ad

45 files changed

Lines changed: 895 additions & 297 deletions

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

README.md

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,9 @@
11
# InSPyReNet: Inverse Saliency Pyramid Reconstruction Network for Salient Object Detection
2+
<p align="center">
3+
4+
<img src="./figures/Title.png" alt="Logo" width="200" height="auto">
5+
6+
</p>
27
<p align="center">
38

49
<img src="./figures/figure1.png" alt="Logo" width="300" height="auto">

configs/InSPyReNetD_Res2Net50.yaml

Lines changed: 90 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,90 @@
1+
Model:
2+
name: "InSPyReNetD_Res2Net50"
3+
depth: 64
4+
pretrained: True
5+
base_size: [384, 384]
6+
PM:
7+
patch_size: 384
8+
stride: 192
9+
10+
Train:
11+
Dataset:
12+
type: "RGB_Dataset"
13+
root: "data/RGB_Dataset/Train_Dataset"
14+
sets: ['DUTS-TR']
15+
transforms:
16+
resize:
17+
size: [384, 384]
18+
random_scale_crop:
19+
range: [0.75, 1.25]
20+
random_flip:
21+
lr: True
22+
ud: False
23+
random_rotate:
24+
range: [-10, 10]
25+
random_image_enhance:
26+
methods: ['contrast', 'sharpness', 'brightness']
27+
tonumpy: NULL
28+
normalize:
29+
mean: [0.485, 0.456, 0.406]
30+
std: [0.229, 0.224, 0.225]
31+
totensor: NULL
32+
Dataloader:
33+
batch_size: 6
34+
shuffle: True
35+
num_workers: 8
36+
pin_memory: True
37+
Optimizer:
38+
type: "Adam"
39+
lr: 1.0e-05
40+
weight_decay: 0.0
41+
mixed_precision: False
42+
Scheduler:
43+
type: "PolyLr"
44+
epoch: 60
45+
gamma: 0.9
46+
minimum_lr: 1.0e-07
47+
warmup_iteration: 12000
48+
Checkpoint:
49+
checkpoint_epoch: 1
50+
checkpoint_dir: "snapshots/InSPyReNetD_Res2Net50"
51+
Debug:
52+
keys: ['gaussian', 'laplacian']
53+
HyperTune:
54+
HyperParameter: ['Train', 'Optimizer', 'lr']
55+
Range: [1.0e-6, 2.4e-5, 24]
56+
57+
Test:
58+
Dataset:
59+
type: "RGB_Dataset"
60+
root: "data/RGB_Dataset/Test_Dataset"
61+
sets: ['DUTS-TE', 'DUT-OMRON', 'ECSSD', 'HKU-IS', 'PASCAL-S']
62+
transforms:
63+
# resize:
64+
# size: [384, 384]
65+
tonumpy: NULL
66+
normalize:
67+
mean: [0.485, 0.456, 0.406]
68+
std: [0.229, 0.224, 0.225]
69+
totensor: NULL
70+
transforms_PM:
71+
resize:
72+
size: NULL
73+
pm : True
74+
tonumpy: NULL
75+
normalize:
76+
mean: [0.485, 0.456, 0.406]
77+
std: [0.229, 0.224, 0.225]
78+
totensor: NULL
79+
Dataloader:
80+
num_workers: 8
81+
pin_memory: True
82+
Checkpoint:
83+
checkpoint_dir: "snapshots/InSPyReNetD_Res2Net50"
84+
85+
Eval:
86+
gt_root: "data/RGB_Dataset/Test_Dataset"
87+
pred_root: "snapshots/InSPyReNetD_Res2Net50"
88+
result_path: "results"
89+
datasets: ['DUTS-TE', 'DUT-OMRON', 'ECSSD', 'HKU-IS', 'PASCAL-S']
90+
metrics: ['Sm', 'mae', 'adpEm', 'maxEm', 'avgEm', 'adpFm', 'maxFm', 'avgFm', 'wFm']

configs/InSPyReNetD_SwinB.yaml

Lines changed: 89 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,89 @@
1+
Model:
2+
name: "InSPyReNetD_SwinB"
3+
depth: 64
4+
pretrained: True
5+
base_size: [384, 384]
6+
7+
8+
9+
Train:
10+
Dataset:
11+
type: "RGBD_Dataset"
12+
root: "data/RGBD_Dataset/Train_Dataset"
13+
sets: ['NJU2K+NLPR']
14+
transforms:
15+
resize:
16+
size: [384, 384]
17+
random_scale_crop:
18+
range: [0.75, 1.25]
19+
random_flip:
20+
lr: True
21+
ud: False
22+
random_rotate:
23+
range: [-10, 10]
24+
random_image_enhance:
25+
methods: ['contrast', 'sharpness', 'brightness']
26+
tonumpy: NULL
27+
normalize:
28+
mean: [0.485, 0.456, 0.406]
29+
std: [0.229, 0.224, 0.225]
30+
totensor: NULL
31+
Dataloader:
32+
batch_size: 6
33+
shuffle: True
34+
num_workers: 8
35+
pin_memory: False
36+
Optimizer:
37+
type: "Adam"
38+
lr: 1.0e-05
39+
weight_decay: 0.0
40+
mixed_precision: False
41+
Scheduler:
42+
type: "PolyLr"
43+
epoch: 300
44+
gamma: 0.9
45+
minimum_lr: 1.0e-07
46+
warmup_iteration: 12000
47+
Checkpoint:
48+
checkpoint_epoch: 1
49+
checkpoint_dir: "snapshots/InSPyReNetD_SwinB"
50+
Debug:
51+
keys: ['gaussian', 'laplacian']
52+
HyperTune:
53+
HyperParameter: ['Train', 'Optimizer', 'lr']
54+
Range: [1.0e-6, 2.4e-5, 24]
55+
56+
Test:
57+
Dataset:
58+
type: "RGBD_Dataset"
59+
root: "data/RGBD_Dataset/Test_Dataset"
60+
sets: ['DES', 'LFSD', 'NJU2K', 'NLPR', 'SIP', 'STERE']
61+
transforms:
62+
resize:
63+
size: [384, 384]
64+
tonumpy: NULL
65+
normalize:
66+
mean: [0.485, 0.456, 0.406]
67+
std: [0.229, 0.224, 0.225]
68+
totensor: NULL
69+
transforms_PM:
70+
resize:
71+
size: NULL
72+
pm : True
73+
tonumpy: NULL
74+
normalize:
75+
mean: [0.485, 0.456, 0.406]
76+
std: [0.229, 0.224, 0.225]
77+
totensor: NULL
78+
Dataloader:
79+
num_workers: 8
80+
pin_memory: True
81+
Checkpoint:
82+
checkpoint_dir: "snapshots/InSPyReNetD_SwinB"
83+
84+
Eval:
85+
gt_root: "data/RGBD_Dataset/Test_Dataset"
86+
pred_root: "snapshots/InSPyReNetD_SwinB"
87+
result_path: "results"
88+
datasets: ['DES', 'LFSD', 'NJU2K', 'NLPR', 'SIP', 'STERE']
89+
metrics: ['Sm', 'mae', 'adpEm', 'maxEm', 'avgEm', 'adpFm', 'maxFm', 'avgFm', 'wFm']

configs/InSPyReNet_Res2Net101.yaml

Lines changed: 7 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -2,9 +2,10 @@ Model:
22
name: "InSPyReNet_Res2Net101"
33
depth: 64
44
pretrained: True
5-
PM:
6-
patch_size: 384
7-
stride: 192
5+
base_size: [384, 384]
6+
PM:
7+
patch_size: 384
8+
stride: 192
89

910
Train:
1011
Dataset:
@@ -67,9 +68,9 @@ Test:
6768
std: [0.229, 0.224, 0.225]
6869
totensor: NULL
6970
transforms_PM:
70-
dynamic_resize:
71-
patch_size: 384
72-
stride: 192
71+
resize:
72+
size: NULL
73+
pm : True
7374
tonumpy: NULL
7475
normalize:
7576
mean: [0.485, 0.456, 0.406]

configs/InSPyReNet_Res2Net50.yaml

Lines changed: 7 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -2,9 +2,10 @@ Model:
22
name: "InSPyReNet_Res2Net50"
33
depth: 64
44
pretrained: True
5-
PM:
6-
patch_size: 384
7-
stride: 192
5+
base_size: [384, 384]
6+
PM:
7+
patch_size: 384
8+
stride: 192
89

910
Train:
1011
Dataset:
@@ -67,9 +68,9 @@ Test:
6768
std: [0.229, 0.224, 0.225]
6869
totensor: NULL
6970
transforms_PM:
70-
dynamic_resize:
71-
patch_size: 384
72-
stride: 192
71+
resize:
72+
size: NULL
73+
pm : True
7374
tonumpy: NULL
7475
normalize:
7576
mean: [0.485, 0.456, 0.406]

configs/InSPyReNet_SwinB.yaml

Lines changed: 6 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -2,9 +2,7 @@ Model:
22
name: "InSPyReNet_SwinB"
33
depth: 64
44
pretrained: True
5-
PM:
6-
patch_size: 384
7-
stride: 96
5+
base_size: [384, 384]
86

97
Train:
108
Dataset:
@@ -60,16 +58,17 @@ Test:
6058
sets: ['DUTS-TE', 'DUT-OMRON', 'ECSSD', 'HKU-IS', 'PASCAL-S']
6159
transforms:
6260
resize:
63-
size: [384, 384]
61+
size: NULL #[384, 384]
62+
pm : False
6463
tonumpy: NULL
6564
normalize:
6665
mean: [0.485, 0.456, 0.406]
6766
std: [0.229, 0.224, 0.225]
6867
totensor: NULL
6968
transforms_PM:
70-
dynamic_resize:
71-
patch_size: 384
72-
stride: 192
69+
resize:
70+
size: NULL
71+
pm : True
7372
tonumpy: NULL
7473
normalize:
7574
mean: [0.485, 0.456, 0.406]

configs/InSPyReNet_SwinL.yaml

Lines changed: 7 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -2,9 +2,10 @@ Model:
22
name: "InSPyReNet_SwinL"
33
depth: 64
44
pretrained: True
5-
PM:
6-
patch_size: 384
7-
stride: 192
5+
base_size: [384, 384]
6+
PM:
7+
patch_size: 384
8+
stride: 192
89

910
Train:
1011
Dataset:
@@ -67,9 +68,9 @@ Test:
6768
std: [0.229, 0.224, 0.225]
6869
totensor: NULL
6970
transforms_PM:
70-
dynamic_resize:
71-
patch_size: 384
72-
stride: 192
71+
resize:
72+
size: NULL
73+
pm : True
7374
tonumpy: NULL
7475
normalize:
7576
mean: [0.485, 0.456, 0.406]

configs/InSPyReNet_SwinS.yaml

Lines changed: 7 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -2,9 +2,10 @@ Model:
22
name: "InSPyReNet_SwinS"
33
depth: 64
44
pretrained: True
5-
PM:
6-
patch_size: 384
7-
stride: 192
5+
base_size: [384, 384]
6+
PM:
7+
patch_size: 384
8+
stride: 192
89

910
Train:
1011
Dataset:
@@ -67,9 +68,9 @@ Test:
6768
std: [0.229, 0.224, 0.225]
6869
totensor: NULL
6970
transforms_PM:
70-
dynamic_resize:
71-
patch_size: 384
72-
stride: 192
71+
resize:
72+
size: NULL
73+
pm : True
7374
tonumpy: NULL
7475
normalize:
7576
mean: [0.485, 0.456, 0.406]

configs/InSPyReNet_SwinT.yaml

Lines changed: 7 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -2,9 +2,10 @@ Model:
22
name: "InSPyReNet_SwinT"
33
depth: 64
44
pretrained: True
5-
PM:
6-
patch_size: 384
7-
stride: 192
5+
base_size: [384, 384]
6+
PM:
7+
patch_size: 384
8+
stride: 192
89

910
Train:
1011
Dataset:
@@ -67,9 +68,9 @@ Test:
6768
std: [0.229, 0.224, 0.225]
6869
totensor: NULL
6970
transforms_PM:
70-
dynamic_resize:
71-
patch_size: 384
72-
stride: 192
71+
resize:
72+
size: NULL
73+
pm : True
7374
tonumpy: NULL
7475
normalize:
7576
mean: [0.485, 0.456, 0.406]

configs/SotA/BASNet.yaml

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -2,9 +2,8 @@ Model:
22
name: "BASNet"
33
depth: None
44
pretrained: True
5-
PM:
6-
patch_size: 384
7-
stride: 96
5+
6+
87

98
Test:
109
Dataset:
@@ -13,16 +12,17 @@ Test:
1312
sets: ['DUTS-TE', 'DUT-OMRON', 'ECSSD', 'HKU-IS', 'PASCAL-S']
1413
transforms:
1514
resize:
16-
size: [384, 384]
15+
size: NULL #[384, 384]
16+
pm: False
1717
tonumpy: NULL
1818
normalize:
1919
mean: [0.485, 0.456, 0.406]
2020
std: [0.229, 0.224, 0.225]
2121
totensor: NULL
2222
transforms_PM:
23-
dynamic_resize:
24-
patch_size: 384
25-
stride: 192
23+
resize:
24+
size: NULL
25+
pm : True
2626
tonumpy: NULL
2727
normalize:
2828
mean: [0.485, 0.456, 0.406]

0 commit comments

Comments
 (0)