Styling and saves now flip back

2020-10-02 16:52:34 +02:00 · 2020-10-02 16:52:34 +02:00 · 2af58fc170
commit 2af58fc170
parent 357d481b97
3 changed files with 79 additions and 47 deletions
--- a/README.md
+++ b/README.md
@ -11,21 +11,24 @@ A `mirror` which shows which faces are detected through three different facial d

 The installation in Windows can be done, though it is quite elaborate:

-* Install rustup-init
-* Install VS C++
 * Install python3
+* Install VS C++
 * Install Cmake (needed for python dlib)
    + make sure to add it to path 
 * Install git
    + including ssh deploy key
 * `git clone https://git.rubenvandeven.com/r/face_detector`
 * `cd face_recognition`
-* `git submodules init`
-* `git submodules update`
 * `pip install virtualenv`
 * `virtualenv.exe venv`
 * `.\venv\Scripts\activate`
 * `cd .\dnn\face_detector`
 * `python.exe .\download_weights.py`
 * `cd .\visualhaar`
+* Either one of:
+    + Compile rust library
+        * Install rustup-init
+        * `git submodules init`
+        * `git submodules update`
        * `cargo build --lib --release`
+    + Download dll from https://git.rubenvandeven.com/r/visualhaar/releases
--- a/face_recognition/comparison.py
+++ b/face_recognition/comparison.py
@ -11,9 +11,9 @@ from PIL import ImageFont, ImageDraw, Image
 import os

 draw_colors = {
-    'hog': (255,255,255), #(198,65,124),
+    'hog': (198,65,124),
    'haar': (255,255,255),
-    'dnn': (255,255,255) #(251,212,36),
+    'dnn': (251,212,36),
 }

 titles = {
@ -45,42 +45,47 @@ class Result():
        })
        return self
    
-    def draw_detections(self, include_title = False):
+    def draw_detections(self, include_title = False, coloured=False):
        cv2_im_rgb = cv2.cvtColor(self.visualisation,cv2.COLOR_BGR2RGB)
        # Pass the image to PIL
        pil_im = Image.fromarray(cv2_im_rgb)
        draw = ImageDraw.Draw(pil_im, 'RGBA')

-        self.draw_detections_on(draw)
+        self.draw_detections_on(draw, coloured)

        if include_title:
-            draw.text((10,10), titles[self.algorithm], fill=draw_colors[self.algorithm], font=font)
+            color = draw_colors[self.algorithm] if coloured else (255,255,255)  
+            draw.text((10,10), titles[self.algorithm], fill=color, font=font, stroke_width=1, stroke_fill=(0,0,0,100))

        return cv2.cvtColor(np.array(pil_im), cv2.COLOR_RGB2BGR)
    
-    def draw_detections_on(self, draw: ImageDraw):
+    def draw_detections_on(self, draw: ImageDraw, coloured=False):
        '''
        Draw on a specified canvas
        '''
-        color = draw_colors[self.algorithm]  
+        color = draw_colors[self.algorithm] if coloured else (255,255,255)  
        for detection in self.detections:
            self.draw_detection(draw, detection, color)

    def draw_detection(self, draw: ImageDraw, detection: dict, color: tuple):
-        width = 2
+       

        if detection['confidence'] > self.confidence_threshold:
+            width = 8
            # draw the bounding box of the face along with the associated
            # probability
            text = "{:.2f}%".format(detection['confidence'] * 100)
            y = detection['startY'] - 40 if detection['startY'] - 40 > 10 else detection['startY'] + 10
            
-            draw.text((detection['startX'], y), text, font=font, fill=color)
+            draw.text((detection['startX'], y), text, font=font, fill=color, stroke_fill=(0,0,0,100), stroke_width=1)
            # cv2.putText(self.visualisation, text, (detection['startX'], y),
            #     cv2.FONT_HERSHEY_SIMPLEX, 0.45, color, 2, lineType = cv2.LINE_AA)

            alpha = 1
+            draw.rectangle((detection['startX']-1, detection['startY']-1, detection['endX']+1, detection['endY']+1), outline=(0,0,0,100), width=1)
+            draw.rectangle((detection['startX']+width, detection['startY']+width, detection['endX']-width, detection['endY']-width), outline=(0,0,0,100), width=1)
        else:
+            width = int(detection['confidence'] * 10 * 8)
            # At least 10% opacity
            alpha = max(.2, detection['confidence'])

@ -90,16 +95,28 @@ class Result():
        
        draw.rectangle((detection['startX'], detection['startY'], detection['endX'], detection['endY']), outline=color, width=width)
        
-
-    def resize(self, width, height):
+    def resize(self, width, height, flip=False):
        # TODO resize to new target incl all detections
        img = self.visualisation
        factor_x = width / self.visualisation.shape[1]
        factor_y = height / self.visualisation.shape[0]
        inter = cv2.INTER_NEAREST if self.algorithm in ['dnn', 'haar'] else cv2.INTER_CUBIC
        img = cv2.resize(img, (width, height), interpolation=inter)
+
+        if flip:
+            img = cv2.flip(img, 1)
+
        result = Result(self.algorithm, img, self.confidence_threshold)
        for d in self.detections:
+            if flip:
+                result.add_detection(
+                    int(width - d['endX'] * factor_x), 
+                    int(d['startY'] * factor_y), 
+                    int(width - d['startX'] * factor_x), 
+                    int(d['endY'] * factor_y),
+                    d['confidence']
+                    )
+            else:
                result.add_detection(
                    int(d['startX'] * factor_x), 
                    int(d['startY'] * factor_y), 
@ -330,7 +347,7 @@ def process2_dnn(in_q, out_q):

        out_q.put(result)

-def process3_haar(in_q, out_q, cascade_file):
+def process3_haar(in_q, out_q, cascade_file, library_filename = None):
    from cffi import FFI
    from PIL import Image
    import cv2
@ -347,6 +364,10 @@ def process3_haar(in_q, out_q, cascade_file):
        void scan_image(haarclassifier, size_t width,size_t height, char *input, char *buffer, size_t length, size_t min_face_factor, bool debug);
    """)

+    
+    if library_filename is not None:
+        C = ffi.dlopen(library_filename)
+    else:
        dir_path = os.path.dirname(os.path.realpath(__file__))
        
        lib_path = os.path.join(dir_path, "..", "visualhaar", "target", "release")
@ -358,7 +379,7 @@ def process3_haar(in_q, out_q, cascade_file):
        elif os.path.exists(dll_path):
            C = ffi.dlopen(dll_path)
        else:
-        raise RuntimeException("Visual haarcascades library is not found")
+            raise RuntimeError("Visual haarcascades library is not found")

    # print(C.test(9))
    # i = Image.open("Marjo.jpg")
@ -434,10 +455,13 @@ def process3_haar(in_q, out_q, cascade_file):
        # print(img)
        out_q.put(result)

-def draw_stats(image, results, padding):
+def draw_stats(image, results, padding, coloured=False):
    pil_im = Image.fromarray(cv2.cvtColor(image, cv2.COLOR_BGR2RGB))
    draw = ImageDraw.Draw(pil_im, 'RGBA')
+    draw_stats_on_canvas(draw, results, padding, coloured)
+    return cv2.cvtColor(np.array(pil_im), cv2.COLOR_RGB2BGR)
    
+def draw_stats_on_canvas(draw, results, padding, coloured=False):
    for i, result in enumerate(results):
        if result is None:
            continue
@ -446,9 +470,9 @@ def draw_stats(image, results, padding):
        txt = "face" if c == 1 else "faces"
        txt = f"{result.algorithm.ljust(5)} {c} {txt}"
        height = padding + 25
-        draw.text((padding, pil_im.size[1] - i*height - height), txt, fill=draw_colors[result.algorithm], font=font_s, stroke_width=1, stroke_fill=(0,0,0))
+        colour = draw_colors[result.algorithm] if coloured else (255,255,255)
+        draw.text((padding, draw.im.size[1] - i*height - height), txt, fill=colour, font=font_s, stroke_width=1, stroke_fill=(0,0,0))

-    return cv2.cvtColor(np.array(pil_im), cv2.COLOR_RGB2BGR)
    

 def display(image_res, q1, q2, q3, q4, fullscreen, output_dir):
@ -543,7 +567,7 @@ def display(image_res, q1, q2, q3, q4, fullscreen, output_dir):
            if countdown_until:
                duration = math.ceil(countdown_until - time.time())
                w, h = draw.textsize(f"{duration}", font=countdown_font)
-                draw.text(((grid_img.shape[1]-w)/2,(grid_img.shape[0]-h)/2), f"{duration}", fill="white", stroke="black", font=countdown_font)
+                draw.text(((grid_img.shape[1]-w)/2,(grid_img.shape[0]-h)/2), f"{duration}", fill="white", stroke="black", font=countdown_font, stroke_width=1, stroke_fill=(0,0,0,100))

            grid_img = cv2.cvtColor(np.array(pil_im), cv2.COLOR_RGB2BGR)
            
@ -565,7 +589,7 @@ def display(image_res, q1, q2, q3, q4, fullscreen, output_dir):
            # SNAP!
            # output_res = (image_res[0] *2, image_res[1] * 2)
            output_res = image_res # no scaling needed anyore
-            pil_im = Image.fromarray(cv2.cvtColor(images[0], cv2.COLOR_BGR2RGB))
+            pil_im = Image.fromarray(cv2.cvtColor(cv2.flip(images[0],1), cv2.COLOR_BGR2RGB))
            pil_im = pil_im.resize(output_res)
            draw = ImageDraw.Draw(pil_im, 'RGBA')

@ -573,7 +597,9 @@ def display(image_res, q1, q2, q3, q4, fullscreen, output_dir):
                if result is None:
                    continue

-                result.resize(output_res[0], output_res[1]).draw_detections_on(draw)
+                result.resize(output_res[0], output_res[1], flip=True).draw_detections_on(draw, coloured=True)
+
+            draw_stats_on_canvas(draw, results, padding, coloured=True)

            override_image = cv2.cvtColor(np.array(pil_im), cv2.COLOR_RGB2BGR)
            override_until = time.time() + 5
@ -583,12 +609,13 @@ def display(image_res, q1, q2, q3, q4, fullscreen, output_dir):
            name = datetime.datetime.now().isoformat(timespec='seconds')
            cv2.imwrite(os.path.join(output_dir, f'{name}.png'),override_image)
            for result in results:
-                cv2.imwrite(os.path.join(output_dir, f'{name}-{result.algorithm}.png'),result.visualisation)
+                result_img =result.draw_detections(include_title = True)
+                cv2.imwrite(os.path.join(output_dir, f'{name}-{result.algorithm}.png'), result_img)

            


-def main(camera_id, rotate, fullscreen, cascade_file, output_dir):
+def main(camera_id, rotate, fullscreen, cascade_file, output_dir, visualhaar_lib = None):
    image_size = (1920, 1080) #(int(1920/2), int(1080/2))

    if not os.path.exists(cascade_file):
@ -616,7 +643,7 @@ def main(camera_id, rotate, fullscreen, cascade_file, output_dir):
    p2 = Process(target=display, args=(image_size, q_webcam1, q_process1, q_process2, q_process3, fullscreen, output_dir ))
    p3 = Process(target=process1_hog, args=(q_webcam2, q_process1,))
    p4 = Process(target=process2_dnn, args=(q_webcam3, q_process2,))
-    p5 = Process(target=process3_haar, args=(q_webcam4, q_process3,cascade_file))
+    p5 = Process(target=process3_haar, args=(q_webcam4, q_process3,cascade_file, visualhaar_lib))

    p1.start()
    p2.start()
--- a/mirror.py
+++ b/mirror.py
@ -15,8 +15,10 @@ if __name__ == '__main__':
                        help='Rotate counter clockwise')
    parser.add_argument('--cascade', default='haarcascade_frontalface_alt2.xml',
                        help='Cascade XML file to use (opencv format)')
-    parser.add_argument('--output', default='saves',
+    parser.add_argument('--output', metavar="DIRECTORY", default='saves',
                        help='Directory to store images (after pressing spacebar)')
+    parser.add_argument('--visualhaar-lib', metavar="LIBRARY", default=None,
+                        help='path/filename for visualhaar library (.so on linux, .dll on windows)\nSee: https://git.rubenvandeven.com/r/visualhaar/releases')

    args = parser.parse_args()

@ -26,4 +28,4 @@ if __name__ == '__main__':
    if args.counter_clockwise:
        rotate = cv2.ROTATE_90_COUNTERCLOCKWISE

-    face_recognition.comparison.main(args.camera, rotate, args.fullscreen, args.cascade, args.output)
+    face_recognition.comparison.main(args.camera, rotate, args.fullscreen, args.cascade, args.output, args.visualhaar_lib)