From 15564efdbb9566a6fb4b3b496b029b3bf8362dc0 Mon Sep 17 00:00:00 2001
From: ioir123ju <549981178@qq.com>
Date: Wed, 17 Jun 2020 11:47:00 +0800
Subject: [PATCH 1/5] [ADD] Add a python demo.

---
 README.md                   |   6 ++
 darknetTR.py                | 185 ++++++++++++++++++++++++++++++++++++
 demo/demo/darknetTR.cpp     | 100 +++++++++++++++++++
 demo/demo/darknetTR.h       |  37 ++++++++
 demo/demo/demo.cpp          |   2 +-
 include/tkDNN/DetectionNN.h |  14 ++-
 6 files changed, 342 insertions(+), 2 deletions(-)
 create mode 100644 darknetTR.py
 create mode 100644 demo/demo/darknetTR.cpp
 create mode 100644 demo/demo/darknetTR.h
diff --git a/README.md b/README.md
index 19b98a28..66459a26 100644
--- a/README.md
+++ b/README.md
@@ -183,6 +183,12 @@ rm yolo3_fp32.rt        # be sure to delete(or move) old tensorRT files
 ./test_yolo3            # run the yolo test (is slow)
 ./demo yolo3_fp32.rt ../demo/yolo_test.mp4 y
 ```
+
+To run the an object detection demo with python (example with yolov4):
+```
+python darknetTR.py build/yolo4_fp16.rt --video=demo/yolo_test.mp4
+```
+
 In general the demo program takes 4 parameters:
 ```
 ./demo <network-rt-file> <path-to-video> <kind-of-network> <number-of-classes> <n-batches> <show-flag>
diff --git a/darknetTR.py b/darknetTR.py
new file mode 100644
index 00000000..d0800825
--- /dev/null
+++ b/darknetTR.py
@@ -0,0 +1,185 @@
+#!/usr/bin/env python
+# -*- encoding: utf-8 -*-
+"""
+@File    :   darknetTR.py.py
+@Contact :   JZ
+
+@Modify Time      @Author    @Version    @Desciption
+------------      -------    --------    -----------
+2020/6/12 14:40   JZ      1.0         None
+"""
+
+from ctypes import *
+import cv2
+import numpy as np
+import argparse
+import os
+from threading import Thread
+import time
+
+class IMAGE(Structure):
+    _fields_ = [("w", c_int),
+                ("h", c_int),
+                ("c", c_int),
+                ("data", POINTER(c_float))]
+
+class BOX(Structure):
+    _fields_ = [("x", c_float),
+                ("y", c_float),
+                ("w", c_float),
+                ("h", c_float)]
+
+class DETECTION(Structure):
+    _fields_ = [("cl", c_int),
+                ("bbox", BOX),
+                ("prob", c_float),
+                ("name", c_char*20),
+                ]
+
+lib = CDLL("./build/libdarknetTR.so", RTLD_GLOBAL)
+
+load_network = lib.load_network
+load_network.argtypes = [c_char_p, c_int, c_int]
+load_network.restype = c_void_p
+
+copy_image_from_bytes = lib.copy_image_from_bytes
+copy_image_from_bytes.argtypes = [IMAGE,c_char_p]
+
+make_image = lib.make_image
+make_image.argtypes = [c_int, c_int, c_int]
+make_image.restype = IMAGE
+
+do_inference = lib.do_inference
+do_inference.argtypes = [c_void_p, IMAGE]
+
+get_network_boxes = lib.get_network_boxes
+get_network_boxes.argtypes = [c_void_p, c_float, c_int, POINTER(c_int)]
+get_network_boxes.restype = POINTER(DETECTION)
+
+# cfg = 'yolo4_fp16.rt'
+# netMain = load_network(cfg.encode("ascii"), 80, 1)  # batch size = 1
+#
+#
+# darknet_image = make_image(512, 512, 3)
+# image = cv2.imread('/home/juzheng/dataset/mask/image/20190821004325_55.jpg')
+# frame_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+# image = cv2.resize(frame_rgb,
+#                    (512, 512),
+#                    interpolation=cv2.INTER_LINEAR)
+#
+# # frame_data = np.asarray(image, dtype=np.uint8)
+# # print(frame_data.shape)
+# frame_data = image.ctypes.data_as(c_char_p)
+# copy_image_from_bytes(darknet_image, frame_data)
+#
+# num = c_int(0)
+#
+# pnum = pointer(num)
+# do_inference(netMain, darknet_image)
+# dets = get_network_boxes(netMain, 0.5, 0, pnum)
+# print('end')
+# print(dets[0].cl, dets[0].prob)
+
+def detect_image(net, meta, darknet_image, thresh=.5):
+    num = c_int(0)
+
+    pnum = pointer(num)
+    do_inference(net, darknet_image)
+    dets = get_network_boxes(net, 0.5, 0, pnum)
+    res = []
+    for i in range(pnum[0]):
+        b = dets[i].bbox
+        res.append((dets[i].name.decode("ascii"), dets[i].prob, (b.x, b.y, b.w, b.h)))
+
+    return res
+
+
+def loop_detect(detect_m, video_path):
+    stream = cv2.VideoCapture(video_path)
+    start = time.time()
+    cnt = 0
+    while stream.isOpened():
+        ret, image = stream.read()
+        if ret is False:
+            break
+        frame_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+        image = cv2.resize(frame_rgb,
+                           (512, 512),
+                           interpolation=cv2.INTER_LINEAR)
+        detections = detect_m.detect(image, need_resize=False)
+        cnt += 1
+        for det in detections:
+            print(det)
+    end = time.time()
+    print("frame:{},time:{:.3f},FPS:{:.2f}".format(cnt, end-start, cnt/(end-start)))
+    stream.release()
+
+
+# class myThread(threading.Thread):
+#    def __init__(self, func, args):
+#       threading.Thread.__init__(self)
+#       self.func = func
+#       self.args = args
+#    def run(self):
+#       # print ("Starting " + self.args[0])
+#       self.func(*self.args)
+#       print ("Exiting " )
+
+
+class YOLO4RT(object):
+    def __init__(self,
+                 input_size=512,
+                 weight_file='./yolo4_fp16.rt',
+                 metaPath='Models/yolo4/coco.data',
+                 nms=0.2,
+                 conf_thres=0.3,
+                 device='cuda'):
+        self.input_size = input_size
+        self.metaMain =None
+        self.model = load_network(weight_file.encode("ascii"), 80, 1)
+        self.darknet_image = make_image(input_size, input_size, 3)
+        self.thresh = conf_thres
+        # self.resize_fn = ResizePadding(input_size, input_size)
+        # self.transf_fn = transforms.ToTensor()
+
+    def detect(self, image, need_resize=True, expand_bb=5):
+        try:
+            if need_resize:
+                frame_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+                image = cv2.resize(frame_rgb,
+                                   (self.input_size, self.input_size),
+                                   interpolation=cv2.INTER_LINEAR)
+            frame_data = image.ctypes.data_as(c_char_p)
+
+            copy_image_from_bytes(self.darknet_image, frame_data)
+
+            detections = detect_image(self.model, self.metaMain, self.darknet_image, thresh=self.thresh)
+
+            # cvDrawBoxes(detections, image)
+            # cv2.imshow("1", image)
+            # cv2.waitKey(1)
+            # detections = self.filter_results(detections, "person")
+            return detections
+        except Exception as e_s:
+            print(e_s)
+
+def parse_args():
+    parser = argparse.ArgumentParser(description='tkDNN detect')
+    parser.add_argument('weight', help='rt file path')
+    parser.add_argument('--video',  type=str, help='video path')
+    args = parser.parse_args()
+
+    return args
+
+
+
+if __name__ == '__main__':
+    args = parse_args()
+    detect_m = YOLO4RT(weight_file=args.weight)
+    t = Thread(target=loop_detect, args=(detect_m, args.video), daemon=True)
+
+    # thread1 = myThread(loop_detect, [detect_m])
+
+    # Start new Threads
+    t.start()
+    t.join()
\ No newline at end of file
diff --git a/demo/demo/darknetTR.cpp b/demo/demo/darknetTR.cpp
new file mode 100644
index 00000000..b64ccfba
--- /dev/null
+++ b/demo/demo/darknetTR.cpp
@@ -0,0 +1,100 @@
+#include "darknetTR.h"
+
+bool gRun;
+bool SAVE_RESULT = false;
+
+void sig_handler(int signo) {
+    std::cout<<"request gateway stop\n";
+    gRun = false;
+}
+
+extern "C"
+{
+
+
+void copy_image_from_bytes(image im, unsigned char *pdata)
+{
+//    unsigned char *data = (unsigned char*)pdata;
+//    int i, k, j;
+    int w = im.w;
+    int h = im.h;
+    int c = im.c;
+//    for (k = 0; k < c; ++k) {
+//        for (j = 0; j < h; ++j) {
+//            for (i = 0; i < w; ++i) {
+//                int dst_index = i + w * j + w * h*k;
+//                int src_index = k + c * i + c * w*j;
+//                im.data[dst_index] = (float)data[src_index] / 255.;
+//            }
+//        }
+//    }
+    memcpy(im.data, pdata, h * w * c);
+
+}
+
+image make_empty_image(int w, int h, int c)
+{
+    image out;
+    out.data = 0;
+    out.h = h;
+    out.w = w;
+    out.c = c;
+    return out;
+}
+
+image make_image(int w, int h, int c)
+{
+    image out = make_empty_image(w,h,c);
+    out.data = (float*)xcalloc(h * w * c, sizeof(float));
+    return out;
+}
+
+tk::dnn::Yolo3Detection* load_network(char* net_cfg, int n_classes, int n_batch)
+{
+    std::string net;
+    net = net_cfg;
+    tk::dnn::Yolo3Detection *detNN = new tk::dnn::Yolo3Detection;
+    detNN->init(net, n_classes, n_batch);
+
+    return detNN;
+}
+#include <typeinfo>
+void do_inference(tk::dnn::Yolo3Detection *net, image im)
+{
+    std::vector<cv::Mat> batch_dnn_input;
+
+    cv::Mat frame(im.h, im.w, CV_8UC3, (unsigned char*)im.data);
+    batch_dnn_input.push_back(frame);
+    net->update(batch_dnn_input, 1);
+
+}
+
+
+detection* get_network_boxes(tk::dnn::Yolo3Detection *net, float thresh, int batch_num, int *pnum)
+{
+    std::vector<std::vector<tk::dnn::box>> batchDetected;
+    batchDetected = net->get_batch_detected();
+    int nboxes =0;
+    std::vector<std::string> classesName = net->get_classesName();
+    detection* dets = (detection*)xcalloc(batchDetected[batch_num].size(), sizeof(detection));
+    for (int i = 0; i < batchDetected[batch_num].size(); ++i)
+    {
+        if (batchDetected[batch_num][i].prob > thresh)
+        {
+            dets[nboxes].cl = batchDetected[batch_num][i].cl;
+            strcpy(dets[nboxes].name,classesName[dets[nboxes].cl].c_str());
+            dets[nboxes].bbox.x = batchDetected[batch_num][i].x;
+            dets[nboxes].bbox.y = batchDetected[batch_num][i].y;
+            dets[nboxes].bbox.w = batchDetected[batch_num][i].w;
+            dets[nboxes].bbox.h = batchDetected[batch_num][i].h;
+            dets[nboxes].prob = batchDetected[batch_num][i].prob;
+            nboxes += 1;
+        }
+    }
+    if (pnum) *pnum = nboxes;
+    return dets;
+}
+}
+
+
+
diff --git a/demo/demo/darknetTR.h b/demo/demo/darknetTR.h
new file mode 100644
index 00000000..07ce0365
--- /dev/null
+++ b/demo/demo/darknetTR.h
@@ -0,0 +1,37 @@
+#ifndef DEMO_H
+#define DEMO_H
+
+#include <iostream>
+#include <signal.h>
+#include <stdlib.h>     /* srand, rand */
+#include <unistd.h>
+#include <mutex>
+#include <malloc.h>
+#include "CenternetDetection.h"
+#include "MobilenetDetection.h"
+#include "Yolo3Detection.h"
+#include "utils.h"
+extern "C"
+{
+typedef struct {
+    int w;
+    int h;
+    int c;
+    float *data;
+} image;
+
+typedef struct {
+    float x, y, w, h;
+}BOX;
+
+typedef struct {
+    int cl;
+    BOX bbox;
+    float prob;
+    char name[20];
+
+}detection;
+
+tk::dnn::Yolo3Detection* load_network(char* net_cfg, int n_classes, int n_batch);
+}
+#endif /* DETECTIONNN_H*/
\ No newline at end of file
diff --git a/demo/demo/demo.cpp b/demo/demo/demo.cpp
index 76b451d8..582b23c1 100644
--- a/demo/demo/demo.cpp
+++ b/demo/demo/demo.cpp
@@ -37,7 +37,7 @@ int main(int argc, char *argv[]) {
     int n_batch = 1;
     if(argc > 5)
         n_batch = atoi(argv[5]); 
-    bool show = true;
+    bool show = false;
     if(argc > 6)
         show = atoi(argv[6]); 
 
diff --git a/include/tkDNN/DetectionNN.h b/include/tkDNN/DetectionNN.h
index 030cf8f9..93ce949c 100644
--- a/include/tkDNN/DetectionNN.h
+++ b/include/tkDNN/DetectionNN.h
@@ -138,7 +138,19 @@ class DetectionNN {
                 TKDNN_TSTOP
                 if(save_times) *times<<t_ns<<"\n";
             }
-        }      
+        }
+        /**
+         * Method to get results.
+         *
+         */
+        std::vector<std::vector<tk::dnn::box>>& get_batch_detected()
+        {
+            return batchDetected;
+        }
+        std::vector<std::string> get_classesName()
+        {
+            return classesNames;
+        }
 
         /**
          * Method to draw boundixg boxes and labels on a frame.

From 40d3018a3e6fa8c699da6878de87afa394d0b0a0 Mon Sep 17 00:00:00 2001
From: ioir123ju <549981178@qq.com>
Date: Wed, 17 Jun 2020 16:32:56 +0800
Subject: [PATCH 2/5] [CHG] Add lib of demo.

---
 CMakeLists.txt | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 8c8619d1..06bcb2dc 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -113,6 +113,14 @@ target_link_libraries(map_demo tkDNN)
 add_executable(demo demo/demo/demo.cpp)
 target_link_libraries(demo tkDNN)
 
+option(BUILD_SHARED_LIBS "Specifies the type of libraries (SHARED or STATIC) to build" ON)
+if (BUILD_SHARED_LIBS)
+    add_library(darknetTR SHARED demo/demo/darknetTR.cpp)
+    target_compile_definitions(darknetTR PRIVATE LIB_EXPORTS=1)
+    target_compile_definitions(darknetTR PRIVATE -DDEMO_EXPORTS)
+    target_link_libraries(darknetTR tkDNN)
+endif()
+
 #-------------------------------------------------------------------------------
 # Install
 #-------------------------------------------------------------------------------

From d07db44bcb04eb177d9ad289694d8ebe5daa9a4b Mon Sep 17 00:00:00 2001
From: ioir123ju <549981178@qq.com>
Date: Wed, 17 Jun 2020 16:58:57 +0800
Subject: [PATCH 3/5] [CHG] ADD xcalloc

---
 include/tkDNN/utils.h | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/include/tkDNN/utils.h b/include/tkDNN/utils.h
index aa73e9ed..d419920f 100644
--- a/include/tkDNN/utils.h
+++ b/include/tkDNN/utils.h
@@ -6,7 +6,7 @@
 #include <fstream>
 #include <iomanip>
 #include <stdlib.h>
-
+#include <malloc.h>
 #include "cuda.h"
 #include "cuda_runtime_api.h"
 #include <cublas_v2.h>
@@ -101,6 +101,12 @@ typedef enum {
   ERROR_CUDNNvsTENSORRT = 8    
 } resultError_t;
 
+void *xmalloc(size_t size);
+void *xcalloc(size_t nmemb, size_t size);
+void malloc_error();
+void calloc_error();
+void realloc_error();
+
 void printCenteredTitle(const char *title, char fill, int dim = 30);
 bool fileExist(const char *fname);
 void downloadWeightsifDoNotExist(const std::string& input_bin, const std::string& test_folder, const std::string& weights_url);

From 95daadcec296f7868cdcbc244d1d83dc0c4bef7f Mon Sep 17 00:00:00 2001
From: ioir123ju <549981178@qq.com>
Date: Wed, 17 Jun 2020 18:37:47 +0800
Subject: [PATCH 4/5] [CHG] ADD xcalloc define

---
 src/utils.cpp | 42 ++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 42 insertions(+)

diff --git a/src/utils.cpp b/src/utils.cpp
index 65030f06..9c6c5f20 100644
--- a/src/utils.cpp
+++ b/src/utils.cpp
@@ -1,6 +1,48 @@
 #include "utils.h"
 #include <string.h>
 
+void *xmalloc(size_t size) {
+    void *ptr=malloc(size);
+    if(!ptr) {
+        malloc_error();
+    }
+    return ptr;
+}
+
+void *xcalloc(size_t nmemb, size_t size) {
+    void *ptr=calloc(nmemb,size);
+    if(!ptr) {
+        calloc_error();
+    }
+    return ptr;
+}
+
+void *xrealloc(void *ptr, size_t size) {
+    ptr=realloc(ptr,size);
+    if(!ptr) {
+        realloc_error();
+    }
+    return ptr;
+}
+
+void malloc_error()
+{
+    fprintf(stderr, "xMalloc error\n");
+    exit(EXIT_FAILURE);
+}
+
+void calloc_error()
+{
+    fprintf(stderr, "Calloc error\n");
+    exit(EXIT_FAILURE);
+}
+
+void realloc_error()
+{
+    fprintf(stderr, "Realloc error\n");
+    exit(EXIT_FAILURE);
+}
+
 void printCenteredTitle(const char *title, char fill, int dim) {
 
     int len = strlen(title);

From e68b0e7bc7fb225c22e72acbb83d25218f553efe Mon Sep 17 00:00:00 2001
From: ioir123ju <549981178@qq.com>
Date: Sun, 28 Jun 2020 10:45:38 +0800
Subject: [PATCH 5/5] [BUG] Improve accuracy

---
 darknetTR.py       | 28 +++++++++++++++++++++++++---
 demo/demo/demo.cpp |  2 +-
 2 files changed, 26 insertions(+), 4 deletions(-)

diff --git a/darknetTR.py b/darknetTR.py
index d0800825..1e53148b 100644
--- a/darknetTR.py
+++ b/darknetTR.py
@@ -80,6 +80,28 @@ class DETECTION(Structure):
 # print('end')
 # print(dets[0].cl, dets[0].prob)
 
+
+def resizePadding(image, height, width):
+    desized_size = height, width
+    old_size = image.shape[:2]
+    max_size_idx = old_size.index(max(old_size))
+    ratio = float(desized_size[max_size_idx]) / max(old_size)
+    new_size = tuple([int(x * ratio) for x in old_size])
+
+    if new_size > desized_size:
+        min_size_idx = old_size.index(min(old_size))
+        ratio = float(desized_size[min_size_idx]) / min(old_size)
+        new_size = tuple([int(x * ratio) for x in old_size])
+
+    image = cv2.resize(image, (new_size[1], new_size[0]))
+    delta_w = desized_size[1] - new_size[1]
+    delta_h = desized_size[0] - new_size[0]
+    top, bottom = delta_h // 2, delta_h - (delta_h // 2)
+    left, right = delta_w // 2, delta_w - (delta_w // 2)
+
+    image = cv2.copyMakeBorder(image, top, bottom, left, right, cv2.BORDER_CONSTANT)
+    return image
+
 def detect_image(net, meta, darknet_image, thresh=.5):
     num = c_int(0)
 
@@ -102,8 +124,9 @@ def loop_detect(detect_m, video_path):
         ret, image = stream.read()
         if ret is False:
             break
-        frame_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
-        image = cv2.resize(frame_rgb,
+        # image = resizePadding(image, 512, 512)
+        # frame_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+        image = cv2.resize(image,
                            (512, 512),
                            interpolation=cv2.INTER_LINEAR)
         detections = detect_m.detect(image, need_resize=False)
@@ -150,7 +173,6 @@ def detect(self, image, need_resize=True, expand_bb=5):
                                    (self.input_size, self.input_size),
                                    interpolation=cv2.INTER_LINEAR)
             frame_data = image.ctypes.data_as(c_char_p)
-
             copy_image_from_bytes(self.darknet_image, frame_data)
 
             detections = detect_image(self.model, self.metaMain, self.darknet_image, thresh=self.thresh)
diff --git a/demo/demo/demo.cpp b/demo/demo/demo.cpp
index 582b23c1..dc493fb9 100644
--- a/demo/demo/demo.cpp
+++ b/demo/demo/demo.cpp
@@ -109,7 +109,7 @@ int main(int argc, char *argv[]) {
         } 
         if(!frame.data) 
             break;
-    
+
         //inference
         detNN->update(batch_dnn_input, n_batch);
         detNN->draw(batch_frame);