blob: 29aef27af3c71131469458c23c70de1eb20d6e5c [file] [log] [blame]
Shad Ansari47432b62021-09-27 22:46:25 +00001"""
2SPDX-FileCopyrightText: 2020-present Open Networking Foundation <info@opennetworking.org>
3SPDX-License-Identifier: LicenseRef-ONF-Member-1.01
4"""
5
6from __future__ import print_function
7
Shad Ansarid3654512021-09-29 10:31:53 -07008import cv2
Shad Ansari47432b62021-09-27 22:46:25 +00009import logging as log
10import os
11import sys
12import time
13from argparse import ArgumentParser, SUPPRESS
Shad Ansari47432b62021-09-27 22:46:25 +000014from imutils import build_montages
15from openvino.inference_engine import IECore
Shad Ansari30a23732021-09-29 23:07:21 -070016from base_camera import BaseCamera
Shad Ansari47432b62021-09-27 22:46:25 +000017
# Default minimum detection confidence; used both as the CLI default below and
# as the class-level fallback on Camera.
DEFAULT_PROB_THRESH = 0.5


def build_argparser():
    """Build the command-line parser for the detection camera.

    The built-in ``-h`` handling of argparse is disabled and re-added
    explicitly so that the help entry is listed in the same 'Options' group
    as every other argument.

    NOTE(review): Camera.__init__ reads ``args.idle``, but no such option is
    defined here. Namespaces produced by this parser therefore lack that
    attribute -- confirm where ``idle`` is expected to come from.

    Returns:
        ArgumentParser: parser with ``--model`` and ``--input`` required and
        all other options optional.
    """
    parser = ArgumentParser(add_help=False)
    args = parser.add_argument_group('Options')
    args.add_argument('-h', '--help', action='help', default=SUPPRESS, help='Show this help message and exit.')
    args.add_argument("-m", "--model", help="Required. Path to an .xml file with a trained model.",
                      required=True, type=str)
    # Camera.__init__ also accepts the literal value 'gstreamer'; the help
    # text mentions it so the option is discoverable from --help.
    args.add_argument("-i", "--input",
                      help="Required. Path to video file or image. 'cam' for capturing video stream from camera, "
                           "'gstreamer' for receiving an RTP/H.264 stream over UDP through a GStreamer pipeline",
                      required=True, type=str)
    args.add_argument("-l", "--cpu_extension",
                      help="Optional. Required for CPU custom layers. Absolute path to a shared library with the "
                           "kernels implementations.", type=str, default=None)
    args.add_argument("-pp", "--plugin_dir", help="Optional. Path to a plugin folder", type=str, default=None)
    args.add_argument("-d", "--device",
                      help="Optional. Specify the target device to infer on; CPU, GPU, FPGA, HDDL or MYRIAD is "
                           "acceptable. The demo will look for a suitable plugin for device specified. "
                           "Default value is CPU", default="CPU", type=str)
    args.add_argument("--labels", help="Optional. Path to labels mapping file", default=None, type=str)
    args.add_argument("-pt", "--prob_threshold", help="Optional. Probability threshold for detections filtering",
                      default=DEFAULT_PROB_THRESH, type=float)
    args.add_argument("-ns", help='No show output', action='store_true')

    return parser
43
44
class Camera(BaseCamera):
    """Camera that runs a detection network on each frame and yields JPEGs.

    The network is loaded through the OpenVINO Inference Engine with two
    infer requests. ``frames()`` alternates between them so that inference on
    the next frame is started before the result for the current frame is
    collected.
    """

    # Class-level fallback; each instance overwrites it from args.prob_threshold.
    prob_threshold = DEFAULT_PROB_THRESH

    def __init__(self, device, args):
        """Load the network and resolve the video source.

        Args:
            device: string forwarded to BaseCamera.__init__. In 'gstreamer'
                mode it is also concatenated onto 'udpsrc port=500' to form
                the UDP port of the pipeline, so it must be a ``str``.
            args: parsed options. This method reads ``model``, ``device``,
                ``input``, ``labels``, ``prob_threshold`` and ``idle``.
                NOTE(review): build_argparser() in this file does not define
                ``idle``; confirm the caller supplies it.

        Raises:
            AssertionError: if the network does not have exactly one input
                and one output, or if ``args.input`` is neither 'cam' nor
                'gstreamer' and is not an existing file.
        """
        log.basicConfig(format="[ %(levelname)s ] %(message)s", level=log.INFO, stream=sys.stdout)
        model_xml = args.model
        # The weights file is expected next to the .xml, same stem, '.bin' suffix.
        model_bin = os.path.splitext(model_xml)[0] + ".bin"

        # One Inference Engine core is used for both reading and loading.
        ie = IECore()

        # Read IR
        log.info("Reading IR...")
        net = ie.read_network(model=model_xml, weights=model_bin)

        assert len(net.inputs.keys()) == 1, "Demo supports only single input topologies"
        assert len(net.outputs) == 1, "Demo supports only single output topologies"
        self.input_blob = next(iter(net.inputs))
        self.out_blob = next(iter(net.outputs))

        log.info("Loading IR to the plugin...")
        # Two requests: one in flight for the next frame, one being read back.
        self.exec_net = ie.load_network(network=net, device_name=args.device, num_requests=2)
        # Input dimensions used later to resize and reshape every frame.
        self.n, self.c, self.h, self.w = net.inputs[self.input_blob].shape
        del net

        if args.input == 'cam':
            # Index 0 is handed to cv2.VideoCapture as the capture device.
            self.input_stream = 0
        elif args.input == 'gstreamer':
            # H.264 over RTP/UDP. An M-JPEG variant of this pipeline would use
            # encoding-name=JPEG,payload=26 with rtpjpegdepay ! decodebin.
            self.input_stream = 'udpsrc port=500' + device + ' caps = " application/x-rtp, media=(string)video, clock-rate=(int)90000, encoding-name=(string)H264, payload=(int)96" ! rtph264depay ! avdec_h264 ! videoconvert ! appsink'
            print("input_stream:", self.input_stream)
        else:
            self.input_stream = args.input
            assert os.path.isfile(args.input), "Specified input file doesn't exist"

        if args.labels:
            with open(args.labels, 'r') as f:
                # One label per line; the line index is used as the class id.
                self.labels_map = [x.strip() for x in f]
        else:
            self.labels_map = None

        self.args = args
        self.prob_threshold = args.prob_threshold

        # Called last, after all state used by frames() is in place.
        # NOTE(review): presumably the base class may start consuming
        # frames() right away -- confirm against BaseCamera.
        super(Camera, self).__init__(device, args.idle)

    def __del__(self):
        """Release the capture device (if one was opened) and close windows."""
        # self.cap only exists once frames() has started running, so it may
        # be missing when the object is destroyed early.
        cap = getattr(self, 'cap', None)
        if cap is not None:
            cap.release()
        cv2.destroyAllWindows()

    def _to_network_input(self, image):
        """Resize ``image`` to the network input size and reorder it to NCHW."""
        blob = cv2.resize(image, (self.w, self.h))
        blob = blob.transpose((2, 0, 1))  # Change data layout from HWC to CHW
        return blob.reshape((self.n, self.c, self.h, self.w))

    def frames(self):
        """Yield JPEG-encoded frames annotated with detections.

        Opens the video source, then loops: read a frame, start inference,
        draw boxes for detections whose confidence exceeds
        ``self.prob_threshold``, overlay ``self.device`` and yield the encoded
        image. The generator ends when the source stops returning frames.

        Yields:
            bytes: the current frame encoded as JPEG.
        """
        # self.input_stream holds the pipeline string in gstreamer mode, so
        # the mode has to be taken from the original argument.
        if self.args.input == 'gstreamer':
            self.cap = cv2.VideoCapture(self.input_stream, cv2.CAP_GSTREAMER)
        else:
            self.cap = cv2.VideoCapture(self.input_stream)

        cur_request_id = 0
        next_request_id = 1

        log.info("Starting inference in async mode...")
        log.info("To switch between sync and async modes press Tab button")
        log.info("To stop the demo execution press Esc button")

        # Note from the original author: async mode was at one point observed
        # to fail with "Runtime Error: [REQUEST BUSY]"; it is enabled anyway.
        self.is_async_mode = True
        ret, frame = self.cap.read()
        if not ret:
            # Without a first frame there is nothing to draw on or encode.
            log.error("Unable to read a frame from input stream %s", self.input_stream)
            return

        print("To close the application, press 'CTRL+C' or any key with focus on the output window")

        while True:
            if self.is_async_mode:
                ret, next_frame = self.cap.read()
            else:
                ret, frame = self.cap.read()
            if not ret:
                break
            initial_w = self.cap.get(cv2.CAP_PROP_FRAME_WIDTH)
            initial_h = self.cap.get(cv2.CAP_PROP_FRAME_HEIGHT)

            # Main sync point:
            # in async mode the NEXT request is started while waiting for the CURRENT one to complete;
            # in regular mode the CURRENT request is started and waited for immediately.
            if self.is_async_mode:
                request_id, pending = next_request_id, next_frame
            else:
                request_id, pending = cur_request_id, frame
            self.exec_net.start_async(request_id=request_id,
                                      inputs={self.input_blob: self._to_network_input(pending)})

            # Only a wait status of 0 is treated as "results available".
            if self.exec_net.requests[cur_request_id].wait(-1) == 0:
                # Parse detection results of the current request
                res = self.exec_net.requests[cur_request_id].outputs[self.out_blob]

                for obj in res[0][0]:
                    # Draw only objects whose probability exceeds the threshold
                    if obj[2] > self.prob_threshold:
                        # obj[3..6] are scaled by the frame size to get pixels.
                        xmin = int(obj[3] * initial_w)
                        ymin = int(obj[4] * initial_h)
                        xmax = int(obj[5] * initial_w)
                        ymax = int(obj[6] * initial_h)
                        class_id = int(obj[1])
                        # Draw box and label/class_id
                        color = (0, 0, 255)
                        cv2.rectangle(frame, (xmin, ymin), (xmax, ymax), color, 2)
                        det_label = self.labels_map[class_id] if self.labels_map else str(class_id)
                        cv2.putText(frame, det_label + ' ' + str(round(obj[2] * 100, 1)) + ' %', (xmin, ymin - 7),
                                    cv2.FONT_HERSHEY_COMPLEX, 0.6, color, 1)

            # self.device is not assigned in this class.
            # NOTE(review): presumably set by BaseCamera.__init__ -- confirm.
            cv2.putText(frame, self.device, (10, int(initial_h - 20)),
                        cv2.FONT_HERSHEY_COMPLEX, 0.5, (10, 10, 200), 1)

            yield cv2.imencode('.jpg', frame)[1].tobytes()

            if self.is_async_mode:
                # The request just started becomes the one to read next time.
                cur_request_id, next_request_id = next_request_id, cur_request_id
                frame = next_frame
Shad Ansari47432b62021-09-27 22:46:25 +0000179
180
if __name__ == '__main__':
    # Script entry point: parse the command-line options and build a Camera.
    args = build_argparser().parse_args()
    # NOTE(review): Camera.__init__ is declared as (device, args), so this
    # one-argument call looks like it raises TypeError as written. It also
    # reads args.idle, which build_argparser() does not define. Confirm the
    # intended device value and where `idle` should come from.
    camera = Camera(args)
    # NOTE(review): frames() contains `yield`, so this call only creates a
    # generator object; nothing is read or inferred unless it is iterated.
    camera.frames()
    del camera
185 del camera