JeVoisBase  1.10
JeVois Smart Embedded Machine Vision Toolkit Base Modules
Share this page:
PyDetectionDNN.py
Go to the documentation of this file.
1 import libjevois as jevois
2 import cv2 as cv
3 import numpy as np
4 import sys
5 
6 ## Object detection and recognition using OpenCV Deep Neural Networks (DNN)
7 #
8 # This module runs an object detection deep neural network using the OpenCV DNN
9 # library. Detection networks analyze a whole scene and produce a number of
10 # bounding boxes around detected objects, together with identity labels
11 # and confidence scores for each detected box.
12 #
13 # This module supports detection networks implemented in TensorFlow, Caffe,
14 # Darknet, Torch, etc as supported by the OpenCV DNN module.
15 #
16 # Included with the standard JeVois distribution are:
17 #
18 # - OpenCV Face Detector, Caffe model
19 # - MobileNet + SSD trained on Pascal VOC (20 object classes), Caffe model
20 # - MobileNet + SSD trained on Coco (80 object classes), TensorFlow model
21 # - MobileNet v2 + SSD trained on Coco (80 object classes), TensorFlow model
22 # - Darknet Tiny YOLO v3 trained on Coco (80 object classes), Darknet model
23 # - Darknet Tiny YOLO v2 trained on Pascal VOC (20 object classes), Darknet model
24 #
25 # See the module's constructor (__init__) code and select a value for \b model to switch network. Object categories are
26 # as follows:
27 # - The 80 COCO object categories are: person, bicycle, car, motorbike, aeroplane, bus, train, truck, boat,
28 # traffic light, fire hydrant, stop sign, parking meter, bench, bird, cat, dog, horse, sheep, cow, elephant,
29 # bear, zebra, giraffe, backpack, umbrella, handbag, tie, suitcase, frisbee, skis, snowboard, sports ball, kite,
30 # baseball bat, baseball glove, skateboard, surfboard, tennis racket, bottle, wine glass, cup, fork, knife, spoon,
31 # bowl, banana, apple, sandwich, orange, broccoli, carrot, hot dog, pizza, donut, cake, chair, sofa, pottedplant,
32 # bed, diningtable, toilet, tvmonitor, laptop, mouse, remote, keyboard, cell phone, microwave, oven, toaster,
33 # sink, refrigerator, book, clock, vase, scissors, teddy bear, hair drier, toothbrush.
33 #
34 # - The 20 Pascal-VOC object categories are: aeroplane, bicycle, bird, boat, bottle, bus, car, cat, chair, cow,
35 # diningtable, dog, horse, motorbike, person, pottedplant, sheep, sofa, train, tvmonitor.
36 #
37 # Sometimes it will make mistakes! The performance of yolov3-tiny is about 33.1% correct (mean average precision) on
38 # the COCO test set. The OpenCV Face Detector is quite fast and robust!
39 #
40 # This module is adapted from the sample OpenCV code:
41 # https://github.com/opencv/opencv/blob/master/samples/dnn/object_detection.py
42 #
43 # More pre-trained models are available on github in opencv_extra
44 #
45 #
46 # @author Laurent Itti
47 #
48 # @videomapping YUYV 640 502 20.0 YUYV 640 480 20.0 JeVois PyDetectionDNN
49 # @email itti@usc.edu
50 # @address 880 W 1st St Suite 807, Los Angeles CA 90012, USA
51 # @copyright Copyright (C) 2018 by Laurent Itti
52 # @mainurl http://jevois.org
53 # @supporturl http://jevois.org
54 # @otherurl http://jevois.org
55 # @license GPL v3
56 # @distribution Unrestricted
57 # @restrictions None
58 # @ingroup modules
60  # ####################################################################################################
61  ## Constructor
    def __init__(self):
        """Constructor.

        Selects one of several pre-trained object detection networks shipped with
        JeVois (Caffe, TensorFlow, or Darknet formats), sets the pre-processing
        parameters that model expects (input size, pixel scaling, mean subtraction,
        channel order), loads its class-name list, and loads the network with
        OpenCV's DNN module on the default backend and CPU target.
        """
        # Default pre-processing parameters; some are overridden per-model below:
        self.confThreshold = 0.5 # Confidence threshold (0..1), higher for stricter detection confidence.
        self.nmsThreshold = 0.4 # Non-maximum suppression threshold (0..1), higher to remove more duplicate boxes.
        self.inpWidth = 160 # Resized image width passed to network
        self.inpHeight = 120 # Resized image height passed to network
        self.scale = 2/255 # Value scaling factor applied to input pixels
        self.mean = [127.5, 127.5, 127.5] # Mean BGR value subtracted from input image
        self.rgb = True # True if model expects RGB inputs, otherwise it expects BGR

        # Select one of the models (uncomment exactly one line):
        model = 'Face' # OpenCV Face Detector, Caffe model
        #model = 'MobileNetV2SSD' # MobileNet v2 + SSD trained on Coco (80 object classes), TensorFlow model
        #model = 'MobileNetSSD' # MobileNet + SSD trained on Pascal VOC (20 object classes), Caffe model
        #model = 'MobileNetSSDcoco' # MobileNet + SSD trained on Coco (80 object classes), TensorFlow model
        #model = 'YOLOv3' # Darknet Tiny YOLO v3 trained on Coco (80 object classes), Darknet model
        #model = 'YOLOv2' # Darknet Tiny YOLO v2 trained on Pascal VOC (20 object classes), Darknet model

        # You should not have to edit anything beyond this point.
        backend = cv.dnn.DNN_BACKEND_DEFAULT
        target = cv.dnn.DNN_TARGET_CPU
        self.classes = None  # list of class-name strings, or None if no class file
        classnames = None
        if (model == 'MobileNetSSD'):
            classnames = '/jevois/share/darknet/yolo/data/voc.names'
            modelname = '/jevois/share/opencv-dnn/detection/MobileNetSSD_deploy.caffemodel'
            configname = '/jevois/share/opencv-dnn/detection/MobileNetSSD_deploy.prototxt'
            self.rgb = False # this Caffe model expects BGR inputs
        elif (model == 'MobileNetV2SSD'):
            classnames = '/jevois/share/darknet/yolo/data/coco.names'
            modelname = '/jevois/share/opencv-dnn/detection/ssd_mobilenet_v2_coco_2018_03_29.pb'
            configname = '/jevois/share/opencv-dnn/detection/ssd_mobilenet_v2_coco_2018_03_29.pbtxt'
        elif (model == 'MobileNetSSDcoco'):
            classnames = '/jevois/share/darknet/yolo/data/coco.names'
            modelname = '/jevois/share/opencv-dnn/detection/ssd_mobilenet_v1_coco_2017_11_17.pb'
            configname = '/jevois/share/opencv-dnn/detection/ssd_mobilenet_v1_coco_2017_11_17.pbtxt'
            self.rgb = False
            self.nmsThreshold = 0.1 # this model emits many overlapping boxes; suppress more aggressively
        elif (model == 'YOLOv3'):
            classnames = '/jevois/share/darknet/yolo/data/coco.names'
            modelname = '/jevois/share/darknet/yolo/weights/yolov3-tiny.weights'
            configname = '/jevois/share/darknet/yolo/cfg/yolov3-tiny.cfg'
        elif (model == 'YOLOv2'):
            classnames = '/jevois/share/darknet/yolo/data/voc.names'
            modelname = '/jevois/share/darknet/yolo/weights/yolov2-tiny-voc.weights'
            configname = '/jevois/share/darknet/yolo/cfg/yolov2-tiny-voc.cfg'
            self.inpWidth = 320 # YOLOv2 needs a larger input size
            self.inpHeight = 240
        else: # default: OpenCV Face Detector, Caffe model
            classnames = '/jevois/share/opencv-dnn/detection/opencv_face_detector.classes'
            modelname = '/jevois/share/opencv-dnn/detection/opencv_face_detector.caffemodel'
            configname = '/jevois/share/opencv-dnn/detection/opencv_face_detector.prototxt'
            self.scale = 1.0 # face detector takes raw pixel values, mean-subtracted only
            self.mean = [104.0, 177.0, 123.0]
            self.rgb = False

        # Load names of classes (one name per line):
        if classnames:
            with open(classnames, 'rt') as f:
                self.classes = f.read().rstrip('\n').split('\n')

        # Load the network:
        self.net = cv.dnn.readNet(modelname, configname)
        self.net.setPreferableBackend(backend)
        self.net.setPreferableTarget(target)
        self.timer = jevois.Timer('Neural detection', 10, jevois.LOG_DEBUG)
        self.model = model
128 
129  # ####################################################################################################
130  ## Get names of the network's output layers
131  def getOutputsNames(self, net):
132  layersNames = self.net.getLayerNames()
133  return [layersNames[i[0] - 1] for i in net.getUnconnectedOutLayers()]
134 
135  # ####################################################################################################
136  ## Analyze and draw boxes, object names, and confidence scores
137  def postprocess(self, frame, outs):
138  frameHeight = frame.shape[0]
139  frameWidth = frame.shape[1]
140 
141  def drawPred(classId, conf, left, top, right, bottom):
142  # Draw a bounding box.
143  cv.rectangle(frame, (left, top), (right, bottom), (0, 255, 0), 2)
144 
145  label = '%.2f' % (conf * 100)
146 
147  # Print a label of class.
148  if self.classes:
149  if (classId >= len(self.classes)):
150  label = 'Oooops id=%d: %s' % (classId, label)
151  else:
152  label = '%s: %s' % (self.classes[classId], label)
153 
154  labelSize, baseLine = cv.getTextSize(label, cv.FONT_HERSHEY_SIMPLEX, 0.4, 1)
155  top = max(top, labelSize[1])
156  cv.rectangle(frame, (left, top - labelSize[1]-2), (left + labelSize[0], top + baseLine),
157  (255, 255, 255), cv.FILLED)
158  cv.putText(frame, label, (left, top), cv.FONT_HERSHEY_SIMPLEX, 0.4, (0, 0, 0))
159 
160  layerNames = self.net.getLayerNames()
161  lastLayerId = self.net.getLayerId(layerNames[-1])
162  lastLayer = self.net.getLayer(lastLayerId)
163 
164  classIds = []
165  confidences = []
166  boxes = []
167  if self.net.getLayer(0).outputNameToIndex('im_info') != -1: # Faster-RCNN or R-FCN
168  # Network produces output blob with a shape 1x1xNx7 where N is a number of
169  # detections and an every detection is a vector of values
170  # [batchId, classId, confidence, left, top, right, bottom]
171  for out in outs:
172  for detection in out[0, 0]:
173  confidence = detection[2]
174  if confidence > self.confThreshold:
175  left = int(detection[3])
176  top = int(detection[4])
177  right = int(detection[5])
178  bottom = int(detection[6])
179  width = right - left + 1
180  height = bottom - top + 1
181  classIds.append(int(detection[1]) - 1) # Skip background label
182  confidences.append(float(confidence))
183  boxes.append([left, top, width, height])
184  elif lastLayer.type == 'DetectionOutput':
185  # Network produces output blob with a shape 1x1xNx7 where N is a number of
186  # detections and an every detection is a vector of values
187  # [batchId, classId, confidence, left, top, right, bottom]
188  for out in outs:
189  for detection in out[0, 0]:
190  confidence = detection[2]
191  if confidence > self.confThreshold:
192  left = int(detection[3] * frameWidth)
193  top = int(detection[4] * frameHeight)
194  right = int(detection[5] * frameWidth)
195  bottom = int(detection[6] * frameHeight)
196  width = right - left + 1
197  height = bottom - top + 1
198  classIds.append(int(detection[1]) - 1) # Skip background label
199  confidences.append(float(confidence))
200  boxes.append([left, top, width, height])
201  elif lastLayer.type == 'Region':
202  # Network produces output blob with a shape NxC where N is a number of
203  # detected objects and C is a number of classes + 4 where the first 4
204  # numbers are [center_x, center_y, width, height]
205  classIds = []
206  confidences = []
207  boxes = []
208  for out in outs:
209  for detection in out:
210  scores = detection[5:]
211  classId = np.argmax(scores)
212  confidence = scores[classId]
213  if confidence > self.confThreshold:
214  center_x = int(detection[0] * frameWidth)
215  center_y = int(detection[1] * frameHeight)
216  width = int(detection[2] * frameWidth)
217  height = int(detection[3] * frameHeight)
218  left = int(center_x - width / 2)
219  top = int(center_y - height / 2)
220  classIds.append(classId)
221  confidences.append(float(confidence))
222  boxes.append([left, top, width, height])
223  else:
224  jevois.LERROR('Unknown output layer type: ' + lastLayer.type)
225  return
226 
227  indices = cv.dnn.NMSBoxes(boxes, confidences, self.confThreshold, self.nmsThreshold)
228  for i in indices:
229  i = i[0]
230  box = boxes[i]
231  left = box[0]
232  top = box[1]
233  width = box[2]
234  height = box[3]
235  drawPred(classIds[i], confidences[i], left, top, left + width, top + height)
236 
237  # ####################################################################################################
238  ## JeVois main processing function
239  def process(self, inframe, outframe):
240  frame = inframe.getCvBGR()
241  self.timer.start()
242 
243  frameHeight = frame.shape[0]
244  frameWidth = frame.shape[1]
245 
246  # Create a 4D blob from a frame.
247  blob = cv.dnn.blobFromImage(frame, self.scale, (self.inpWidth, self.inpHeight), self.mean, self.rgb, crop=False)
248 
249  # Run a model
250  self.net.setInput(blob)
251  if self.net.getLayer(0).outputNameToIndex('im_info') != -1: # Faster-RCNN or R-FCN
252  frame = cv.resize(frame, (self.inpWidth, self.inpHeight))
253  self.net.setInput(np.array([inpHeight, inpWidth, 1.6], dtype=np.float32), 'im_info')
254  outs = self.net.forward(self.getOutputsNames(self.net))
255 
256  self.postprocess(frame, outs)
257 
258  # Create dark-gray (value 80) image for the bottom panel, 22 pixels tall:
259  msgbox = np.zeros((22, frame.shape[1], 3), dtype = np.uint8) + 80
260 
261  # Put efficiency information.
262  cv.putText(frame, 'JeVois Python Object Detection DNN - ' + self.model, (3, 15),
263  cv.FONT_HERSHEY_SIMPLEX, 0.4, (255, 255, 255), 1, cv.LINE_AA)
264  t, _ = self.net.getPerfProfile()
265  fps = self.timer.stop()
266  label = fps + ' - Inference time: %.2fms' % (t * 1000.0 / cv.getTickFrequency())
267  cv.putText(msgbox, label, (3, 15), cv.FONT_HERSHEY_SIMPLEX, 0.4, (255, 255, 255), 1, cv.LINE_AA)
268 
269  # Stack bottom panel below main image:
270  frame = np.vstack((frame, msgbox))
271 
272  # Send output frame to host:
273  outframe.sendCv(frame)
def process(self, inframe, outframe)
JeVois main processing function.
Object detection and recognition using OpenCV Deep Neural Networks (DNN)
def postprocess(self, frame, outs)
Analyze and draw boxes, object names, and confidence scores.
def __init__(self)
Constructor.
def getOutputsNames(self, net)
Get names of the network's output layers.
std::vector< std::string > split(std::string const &input, std::string const &regex="\")