# peleenetssd.py -- from a fork of Tencent/ncnn
# Tencent is pleased to support the open source community by making ncnn available.
#
# Copyright (C) 2020 THL A29 Limited, a Tencent company. All rights reserved.
#
# Licensed under the BSD 3-Clause License (the "License"); you may not use this file except
# in compliance with the License. You may obtain a copy of the License at
#
# https://opensource.org/licenses/BSD-3-Clause
#
# Unless required by applicable law or agreed to in writing, software distributed
# under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
# CONDITIONS OF ANY KIND, either express or implied. See the License for the
# specific language governing permissions and limitations under the License.
import sys
import cv2
import numpy as np
from ncnn.model_zoo import get_model
def _draw_labeled_box(image, class_names, obj):
    """Log one detection and draw its box and caption onto ``image`` in place.

    Args:
        image: Array the OpenCV drawing calls write into; ``image.shape[1]``
            is used as the right-hand limit for the caption.
        class_names: Sequence indexed by ``int(obj.label)`` to get the
            caption text.
        obj: Detection exposing ``label``, ``prob`` and ``rect`` (which in
            turn exposes ``x``, ``y``, ``w`` and ``h``).
    """
    rect = obj.rect
    print(
        "%d = %.5f at %.2f %.2f %.2f x %.2f\n"
        % (obj.label, obj.prob, rect.x, rect.y, rect.w, rect.h)
    )

    cv2.rectangle(
        image,
        (int(rect.x), int(rect.y)),
        (int(rect.x + rect.w), int(rect.y + rect.h)),
        (255, 0, 0),
    )

    text = "%s %.1f%%" % (class_names[int(obj.label)], obj.prob * 100)
    label_size, baseline = cv2.getTextSize(text, cv2.FONT_HERSHEY_SIMPLEX, 0.5, 1)

    # Put the caption just above the box, then clamp it so it does not run
    # past the top or the right-hand border of the image.
    x = rect.x
    y = rect.y - label_size[1] - baseline
    if y < 0:
        y = 0
    if x + label_size[0] > image.shape[1]:
        x = image.shape[1] - label_size[0]

    # Filled white background (thickness -1) behind the black caption text.
    cv2.rectangle(
        image,
        (int(x), int(y)),
        (int(x + label_size[0]), int(y + label_size[1] + baseline)),
        (255, 255, 255),
        -1,
    )
    cv2.putText(
        image,
        text,
        (int(x), int(y + label_size[1])),
        cv2.FONT_HERSHEY_SIMPLEX,
        0.5,
        (0, 0, 0),
    )


def _blend_segmentation(image, mat_map, color, threshold):
    """Tint ``image`` in place with the winning segmentation class per pixel.

    For each pixel, the winning channel is the first one whose score is the
    largest value strictly greater than ``threshold``. Pixels with no such
    channel, or whose winning channel has no entry in ``color``, are left
    untouched. A painted pixel becomes ``color / 2 + pixel / 2``, truncated
    to the image dtype.

    Args:
        image: Array indexed as ``[row, column, component]``; only the top-left
            ``mat_map.h`` x ``mat_map.w`` region is touched.
            NOTE(review): assumes three components per pixel in b, g, r
            order, matching the colour triples -- confirm against the caller.
        mat_map: Score map exposing ``w``, ``h`` and ``c`` and convertible
            with ``np.array`` to ``c`` planes of ``h * w`` scores each.
        color: Flat list of colour components, three per class (b, g, r).
        threshold: Score a channel has to exceed before it can win a pixel.
    """
    width = mat_map.w
    height = mat_map.h
    size = mat_map.c

    # Index the scores as [channel, row, column]. The reshape also rejects a
    # buffer that does not hold exactly size * height * width values.
    scores = np.array(mat_map).reshape(size, height, width)

    # Run the "strictly greater than the best so far" scan once per channel
    # over whole planes instead of once per pixel. The strict comparison
    # keeps the lowest channel on ties, and float64 storage holds every
    # score exactly.
    best = np.full((height, width), threshold, dtype=np.float64)
    winner = np.full((height, width), -1, dtype=np.intp)
    for channel in range(size):
        plane = scores[channel]
        better = plane > best
        best[better] = plane[better]
        winner[better] = channel

    # One (b, g, r) row per class that has a colour assigned.
    palette = np.array(color).reshape(-1, 3)
    paint = (winner >= 0) & (winner < len(palette))

    # Basic slicing returns a view, so the assignment below writes straight
    # into the caller's image.
    region = image[:height, :width]
    blended = palette[winner[paint]] / 2 + region[paint] / 2
    region[paint] = blended.astype(image.dtype)


def draw_detection_objects_seg(image, class_names, objects, mat_map):
    """Draw detections and a segmentation overlay on ``image``, then show it.

    The image is modified in place: every detection is printed and drawn as a
    box with a caption, then pixels whose segmentation score exceeds 0.45 are
    blended half-and-half with their class colour. Finally the result is
    displayed in a window named "image" and the call blocks in
    ``cv2.waitKey(0)``.

    Args:
        image: Image array to draw on (modified in place).
        class_names: Sequence of class names indexed by detection label.
        objects: Iterable of detections exposing ``label``, ``prob`` and
            ``rect`` (with ``x``, ``y``, ``w``, ``h``).
        mat_map: Segmentation score map exposing ``w``, ``h`` and ``c`` and
            convertible to an array with ``np.array``.
    """
    # Flat (b, g, r) triples: one per segmentation class that gets painted.
    color = [128, 255, 128, 244, 35, 232]
    threshold = 0.45

    for obj in objects:
        _draw_labeled_box(image, class_names, obj)

    # The overlay is applied after the boxes, so boxes and captions that lie
    # on segmented pixels are tinted as well.
    _blend_segmentation(image, mat_map, color, threshold)

    cv2.imshow("image", image)
    cv2.waitKey(0)
if __name__ == "__main__":
    # Exactly one command-line argument is expected: the image to process.
    if len(sys.argv) != 2:
        print("Usage: %s [imagepath]\n" % (sys.argv[0]), file=sys.stderr)
        # Exit non-zero so shells and calling scripts can detect the misuse.
        sys.exit(1)

    imagepath = sys.argv[1]

    # A None result is treated as a failed load of the image file.
    m = cv2.imread(imagepath)
    if m is None:
        print("cv2.imread %s failed\n" % (imagepath), file=sys.stderr)
        sys.exit(1)

    net = get_model("peleenet_ssd", num_threads=4, use_gpu=True)

    # Calling the model yields the detections and a segmentation map, which
    # are drawn onto the loaded image and displayed.
    objects, seg_out = net(m)

    draw_detection_objects_seg(m, net.class_names, objects, seg_out)