detector.py · 216 lines (181 loc) · 8.68 KB
from __future__ import print_function
import sys
import os
from argparse import ArgumentParser
import cv2
import time
import logging as log
from openvino.inference_engine import IENetwork, IEPlugin
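
# Object detection demo built on the OpenVINO Inference Engine (legacy IENetwork / IEPlugin API).
# It loads an SSD-style IR model from a folder, runs it on a camera or a video file in sync or
# async mode, draws the detected boxes with labels and timing stats, and can optionally record
# the annotated stream to an AVI file.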

def get_parser():
    parser = ArgumentParser()
    # Path to the folder with the model and to the file to process
    parser.add_argument("-m", "--model_path", help="Path to the folder with the model (.xml and .bin IR files)",
                        required=True, type=str)
    parser.add_argument("-i", "--input",
                        help="Path to a video file or image. Default 'cam' (use the camera)",
                        default="cam", type=str)
    parser.add_argument("-o", "--output",
                        help="Path to a folder in which to save the output video", default=None, type=str)
    parser.add_argument("-r", "--resolution", help="Capture resolution, for example 640X480",
                        default='640X480', type=str)
    # Device on which to run the DNN computations
    parser.add_argument("-d", "--device",
                        help="Target device: CPU or MYRIAD. "
                             "If CPU, pass --cpu_extension as well", default="CPU",
                        type=str)
    parser.add_argument("-l", "--cpu_extension",
                        help="Path to the MKLDNN library for the CPU; look under "
                             "/deployment_tools/inference_engine/lib", type=str, default=None)
    # Labels for the neural network
    parser.add_argument("--labels", help="Labels mapping file", default=None, type=str)
    # Probability threshold
    parser.add_argument("-pt", "--prob_threshold", help="Probability threshold for filtering detections",
                        default=0.5, type=float)
    return parser
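
# Example invocation (paths are placeholders; adjust them for your setup):
#   python detector.py -m /path/to/ir_model_dir -i video.mp4 -d CPU \
#       -l /path/to/libcpu_extension.so --labels labels.txt -pt 0.6
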

def main():
    log.basicConfig(format="[ %(levelname)s ] %(message)s", level=log.INFO, stream=sys.stdout)
    args = get_parser().parse_args()
    # Plugin initialization for the specified device; load the extensions library if provided
    log.info("Initializing plugin for {} device".format(args.device))
    plugin = IEPlugin(device=args.device)
    # Locate the IR files (.bin weights and .xml topology) in the model folder
    for f in os.listdir(args.model_path):
        if f.endswith('.bin'):
            weights = os.path.join(args.model_path, f)
        if f.endswith('.xml'):
            model = os.path.join(args.model_path, f)
    log.info("Reading IR")
    net = IENetwork(model=model, weights=weights)
    input_blob = next(iter(net.inputs))
    out_blob = next(iter(net.outputs))
    # Set the CPU extension and verify that all layers are supported
    if plugin.device == "CPU":
        if args.cpu_extension:
            plugin.add_cpu_extension(args.cpu_extension)
        supported_layers = plugin.get_supported_layers(net)
        not_supported_layers = [l for l in net.layers.keys() if l not in supported_layers]
        if len(not_supported_layers) != 0:
            log.error("Following layers are not supported by the plugin for specified device {}:\n {}".
                      format(plugin.device, ', '.join(not_supported_layers)))
            log.error("Please try to specify the cpu extensions library path using the -l "
                      "or --cpu_extension command line argument")
            sys.exit(1)
    log.info("Loading IR to the plugin")
    exec_net = plugin.load(network=net, num_requests=2)
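    # Two infer requests are created so that, in async mode, inference on the next frame can be
    # queued while the current request is still running (the request ids are swapped further
    # down in the main loop).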
    # Build the labels dict from a file with "id: label" lines
    if args.labels:
        labels_map = {}
        with open(args.labels, 'r') as f:
            for line in f:
                label = line.split(': ')
                labels_map[int(label[0])] = label[1].strip()
    # Read the input shape expected by the network (NCHW)
    n, c, h, w = net.inputs[input_blob].shape
    del net
    if args.input == 'cam':
        input_stream = 0
    elif args.input.isdigit():
        # A bare number selects a camera by index
        input_stream = int(args.input)
    else:
        input_stream = args.input
        assert os.path.isfile(args.input), "Specified input file doesn't exist"
    cap = cv2.VideoCapture(input_stream)
    stream_w, stream_h = (int(x) for x in args.resolution.split('X'))
    cap.set(cv2.CAP_PROP_FRAME_WIDTH, stream_w)
    cap.set(cv2.CAP_PROP_FRAME_HEIGHT, stream_h)
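    # NOTE: the requested resolution typically only applies to live camera sources; for video
    # files OpenCV keeps the file's native resolution.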
    cur_request_id = 0
    next_request_id = 1
    log.info("Starting inference in sync mode...")
    log.info("To switch between sync and async modes press the Tab button")
    log.info("To stop the demo execution press the Esc button")
    render_time = 0
    freq = cv2.getTickFrequency()
    ret, frame = cap.read()
    is_async_mode = False
    # Set up the output video file, matching the source FPS and the actual frame size
    if args.output:
        fps = cap.get(cv2.CAP_PROP_FPS) or 30.0  # cameras may report 0 FPS
        file_name = os.path.join(args.output, '{}-{}.avi'.format(time.strftime("%Y%m%d-%H%M%S"), args.device))
        out = cv2.VideoWriter(file_name, cv2.VideoWriter_fourcc('M', 'J', 'P', 'G'), fps,
                              (frame.shape[1], frame.shape[0]))
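    # Main loop: grab a frame, run (or queue) inference, draw the detections and timing stats,
    # then record/display the annotated frame and handle keyboard input.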
    while cap.isOpened():
        t1 = cv2.getTickCount()
        if is_async_mode:
            ret, next_frame = cap.read()
        else:
            ret, frame = cap.read()
        if not ret:
            break
        initial_w = cap.get(cv2.CAP_PROP_FRAME_WIDTH)
        initial_h = cap.get(cv2.CAP_PROP_FRAME_HEIGHT)
        # Main sync point:
        # in the truly async mode we start the NEXT infer request while waiting for the CURRENT one to complete;
        # in the regular mode we start the CURRENT request and immediately wait for its completion
        inf_start = time.time()
        if is_async_mode:
            in_frame = cv2.resize(next_frame, (w, h))
            in_frame = in_frame.transpose((2, 0, 1))  # Change data layout from HWC to CHW
            in_frame = in_frame.reshape((n, c, h, w))
            exec_net.start_async(request_id=next_request_id, inputs={input_blob: in_frame})
        else:
            in_frame = cv2.resize(frame, (w, h))
            in_frame = in_frame.transpose((2, 0, 1))  # Change data layout from HWC to CHW
            in_frame = in_frame.reshape((n, c, h, w))
            exec_net.start_async(request_id=cur_request_id, inputs={input_blob: in_frame})
        if exec_net.requests[cur_request_id].wait(-1) == 0:
            inf_end = time.time()
            det_time = inf_end - inf_start
            # Parse detection results of the current request
            res = exec_net.requests[cur_request_id].outputs[out_blob]
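            # Each detection in the SSD output is a row of
            # [image_id, class_id, confidence, xmin, ymin, xmax, ymax] with coordinates normalized to [0, 1]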
            for obj in res[0][0]:
                # Draw only objects whose probability exceeds the specified threshold
                if obj[2] > args.prob_threshold:
                    xmin = int(obj[3] * initial_w)
                    ymin = int(obj[4] * initial_h)
                    xmax = int(obj[5] * initial_w)
                    ymax = int(obj[6] * initial_h)
                    class_id = int(obj[1])
                    # Draw the box and the label/class_id
                    color = (min(class_id * 4, 255), min(class_id * 3 + 100, 255), min(class_id * 2, 255))
                    cv2.rectangle(frame, (xmin, ymin), (xmax, ymax), color, 2)
                    det_label = labels_map.get(class_id, str(class_id)) if args.labels else str(class_id)
                    cv2.putText(frame, det_label + ' ' + str(round(obj[2] * 100, 1)) + ' %', (xmin, ymin - 7),
                                cv2.FONT_HERSHEY_COMPLEX, 0.6, color, 1)
            t2 = cv2.getTickCount()
            time1 = (t2 - t1) / freq
            frame_rate_calc = 1 / time1
            # Draw performance stats
            inf_time_message = "Inference time: N/A for async mode" if is_async_mode else \
                "Inference time: {:.3f} ms".format(det_time * 1000)
            render_time_message = "OpenCV rendering time: {:.3f} ms".format(render_time * 1000)
            fps_message = "FPS: {:.2f}".format(frame_rate_calc)
            async_mode_message = "Async mode is on. Processing request {}".format(cur_request_id) if is_async_mode else \
                "Async mode is off. Processing request {}".format(cur_request_id)
            cv2.putText(frame, inf_time_message, (15, 15), cv2.FONT_HERSHEY_COMPLEX, 0.5, (200, 10, 10), 1)
            cv2.putText(frame, render_time_message, (15, 30), cv2.FONT_HERSHEY_COMPLEX, 0.5, (10, 10, 200), 1)
            cv2.putText(frame, fps_message, (15, 45), cv2.FONT_HERSHEY_COMPLEX, 0.5, (10, 10, 200), 1)
            cv2.putText(frame, async_mode_message, (10, int(initial_h - 20)), cv2.FONT_HERSHEY_COMPLEX, 0.5,
                        (10, 10, 200), 1)
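        # Record and/or display the annotated frame, then handle keyboard input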
        if args.output:
            out.write(frame)
        render_start = time.time()
        cv2.imshow("Detection Results", frame)
        render_end = time.time()
        render_time = render_end - render_start
        if is_async_mode:
            # Swap the infer requests and promote the queued frame to the current one
            cur_request_id, next_request_id = next_request_id, cur_request_id
            frame = next_frame
        key = cv2.waitKey(1)
        if key == 27:  # Esc stops the demo
            break
        if key == 9:  # Tab toggles between sync and async mode
            is_async_mode = not is_async_mode
            log.info("Switched to {} mode".format("async" if is_async_mode else "sync"))
    cap.release()
    if args.output:
        out.release()
    cv2.destroyAllWindows()
    del exec_net
    del plugin


if __name__ == '__main__':
    sys.exit(main() or 0)