"""
SPDX-FileCopyrightText: 2020-present Open Networking Foundation <info@opennetworking.org>
SPDX-License-Identifier: LicenseRef-ONF-Member-1.01
"""
| 5 | |
| 6 | from __future__ import print_function |
| 7 | |
Shad Ansari | a271465 | 2021-10-23 00:10:18 +0000 | [diff] [blame] | 8 | from collections import namedtuple |
Shad Ansari | 47432b6 | 2021-09-27 22:46:25 +0000 | [diff] [blame] | 9 | import logging as log |
| 10 | import os |
| 11 | import sys |
Shad Ansari | 47432b6 | 2021-09-27 22:46:25 +0000 | [diff] [blame] | 12 | from argparse import ArgumentParser, SUPPRESS |
Shad Ansari | 47432b6 | 2021-09-27 22:46:25 +0000 | [diff] [blame] | 13 | from imutils import build_montages |
Shad Ansari | a271465 | 2021-10-23 00:10:18 +0000 | [diff] [blame] | 14 | |
| 15 | import cv2 |
Shad Ansari | 47432b6 | 2021-09-27 22:46:25 +0000 | [diff] [blame] | 16 | from openvino.inference_engine import IECore |
Shad Ansari | a271465 | 2021-10-23 00:10:18 +0000 | [diff] [blame] | 17 | |
Shad Ansari | 30a2373 | 2021-09-29 23:07:21 -0700 | [diff] [blame] | 18 | from base_camera import BaseCamera |
Shad Ansari | 47432b6 | 2021-09-27 22:46:25 +0000 | [diff] [blame] | 19 | |
Shad Ansari | 47432b6 | 2021-09-27 22:46:25 +0000 | [diff] [blame] | 20 | |
class Camera(BaseCamera):
    """Camera that runs an OpenVINO detection network on a video stream.

    Frames are read with OpenCV from a webcam, a GStreamer RTP/H.264 UDP
    pipeline or a video file, passed through the network on the CPU, and
    yielded as JPEG bytes with the detection boxes drawn on them.
    """

    # Network input dimensions: batch size, channels, height, width.
    Shape = namedtuple('Shape', ['n', 'c', 'h', 'w'])

    def __init__(self, device, args):
        """Store the detection settings and initialise the base camera.

        Args:
            device: Camera identifier. It is appended to ``500`` to build the
                UDP port in ``gstreamer`` mode and is drawn on every frame.
            args: Options object providing ``model``, ``input``,
                ``prob_threshold``, ``key``, ``mbrlow``, ``mbrhigh``,
                ``devicegroup`` and ``noroc``.
        """
        log.basicConfig(format="[ %(levelname)s ] %(message)s", level=log.INFO, stream=sys.stdout)

        self.model_xml = args.model
        self.input = args.input
        self.prob_threshold = args.prob_threshold
        self.is_async_mode = True
        self.device = device

        super(Camera, self).__init__(device, args.key, args.mbrlow, args.mbrhigh, args.devicegroup, args.noroc)

    def __del__(self):
        """Destroy any OpenCV windows when the camera object is collected."""
        cv2.destroyAllWindows()

    def init_stream(self):
        """Open the video source selected by ``self.input``.

        ``'cam'`` opens local capture device 0, ``'gstreamer'`` opens an
        RTP/H.264 UDP pipeline listening on port ``500<device>``, and any
        other value is treated as the path of a video file.

        Returns:
            The opened ``cv2.VideoCapture``; the caller must release it.

        Raises:
            AssertionError: If a file path was given and it does not exist.
        """
        use_gstreamer = self.input == 'gstreamer'

        if self.input == 'cam':
            input_stream = 0
        elif use_gstreamer:
            # str() keeps the concatenation valid for integer device ids too.
            input_stream = (
                'udpsrc port=500' + str(self.device) +
                ' caps = " application/x-rtp, media=(string)video,'
                ' clock-rate=(int)90000, encoding-name=(string)H264,'
                ' payload=(int)96" ! rtph264depay !'
                ' avdec_h264 output-corrupt=false ! videoconvert ! appsink'
            )
        else:
            input_stream = self.input
            assert os.path.isfile(self.input), "Specified input file doesn't exist"

        if use_gstreamer:
            return cv2.VideoCapture(input_stream, cv2.CAP_GSTREAMER)
        return cv2.VideoCapture(input_stream)

    def init_inference(self):
        """Read the IR model and load it onto the CPU with two infer requests.

        The weights file is expected next to the model XML, with the same
        base name and a ``.bin`` extension; its path is stored in
        ``self.model_bin``.

        Returns:
            Tuple ``(exec_net, shape, input_blob, out_blob)``: the executable
            network, the input dimensions as a ``Camera.Shape``, and the
            names of the single input and single output blobs.

        Raises:
            AssertionError: If the network does not have exactly one input
                and exactly one output.
        """
        self.model_bin = os.path.splitext(self.model_xml)[0] + ".bin"

        # One IECore instance serves both reading and loading the network.
        ie = IECore()

        log.info("Reading IR...")
        net = ie.read_network(model=self.model_xml, weights=self.model_bin)

        assert len(net.inputs.keys()) == 1, "Demo supports only single input topologies"
        assert len(net.outputs) == 1, "Demo supports only single output topologies"
        input_blob = next(iter(net.inputs))
        out_blob = next(iter(net.outputs))

        log.info("Loading IR to the plugin...")
        exec_net = ie.load_network(network=net, device_name="CPU", num_requests=2)
        shape = Camera.Shape(*net.inputs[input_blob].shape)

        # The network description is no longer needed once it is loaded.
        del net

        return exec_net, shape, input_blob, out_blob

    def frames(self):
        """Yield annotated JPEG frames until the stream stops delivering.

        Each frame is resized to 640x480. Detections whose probability
        exceeds ``self.prob_threshold`` are boxed and labelled, and the
        detection count and camera id are drawn as overlays.
        ``self.person_detected(count)`` is called for every frame that has at
        least one detection (not defined in this class; presumably provided
        by ``BaseCamera``).

        Yields:
            bytes: The JPEG-encoded annotated frame.
        """
        exec_net, shape, input_blob, out_blob = self.init_inference()
        stream = self.init_stream()

        # Fixed output geometry and drawing settings (colours are BGR).
        out_w, out_h = 640, 480
        red = (0, 0, 255)
        black = (0, 0, 0)
        font = cv2.FONT_HERSHEY_COMPLEX

        cur_request_id = 0
        next_request_id = 1

        try:
            ret, frame = stream.read()

            while True:
                if self.is_async_mode:
                    ret, next_frame = stream.read()
                else:
                    ret, frame = stream.read()
                if not ret:
                    break

                # Main sync point:
                # in async mode the NEXT request is started while the CURRENT
                # one completes; in regular mode the CURRENT request is
                # started and waited for immediately.
                if self.is_async_mode:
                    infer_frame, infer_id = next_frame, next_request_id
                else:
                    infer_frame, infer_id = frame, cur_request_id

                in_frame = cv2.resize(infer_frame, (shape.w, shape.h))
                in_frame = in_frame.transpose((2, 0, 1))  # HWC -> CHW
                in_frame = in_frame.reshape((shape.n, shape.c, shape.h, shape.w))
                exec_net.start_async(request_id=infer_id, inputs={input_blob: in_frame})

                # NOTE(review): on the first async pass the current request
                # has not been started yet; presumably wait() then returns a
                # non-zero status and the frame is skipped - confirm.
                if exec_net.requests[cur_request_id].wait(-1) == 0:
                    # Parse detection results of the current request.
                    res = exec_net.requests[cur_request_id].outputs[out_blob]

                    frame = cv2.resize(frame, (out_w, out_h))

                    obj_count = 0
                    for obj in res[0][0]:
                        # obj[2] is the probability; obj[3:7] are the box
                        # corners, scaled below by the output frame size.
                        if obj[2] > self.prob_threshold:
                            xmin = int(obj[3] * out_w)
                            ymin = int(obj[4] * out_h)
                            xmax = int(obj[5] * out_w)
                            ymax = int(obj[6] * out_h)
                            # Draw box and probability.
                            cv2.rectangle(frame, (xmin, ymin), (xmax, ymax), red, 2)
                            cv2.putText(frame, str(round(obj[2] * 100, 1)) + ' %', (xmin, ymin - 7),
                                        font, 0.6, black, 1)
                            obj_count += 1

                    cv2.putText(frame, "persons: {}".format(obj_count), (10, 20),
                                font, 0.6, black, 1)
                    cv2.putText(frame, "camera: {}".format(self.device), (10, out_h - 20),
                                font, 0.6, black, 1)

                    if obj_count > 0:
                        self.person_detected(obj_count)

                    yield cv2.imencode('.jpg', frame)[1].tobytes()

                if self.is_async_mode:
                    cur_request_id, next_request_id = next_request_id, cur_request_id
                    frame = next_frame
        finally:
            # Runs when the stream ends and when the generator is closed or
            # garbage-collected, so the capture handle is always released.
            stream.release()