Mirror of https://github.com/iperov/DeepFaceLab.git
Manual extractor: you can now specify the face rectangle manually using the R mouse button.
It is useful for small, blurry, or otherwise undetectable faces, and for animal faces. https://i.imgur.com/8kmVgg8.jpg Warning: such frames must be used only with the XSeg workflow! Landmarks cannot be placed on the face precisely; they are actually used only for positioning the red frame. Try to keep the red frame consistent with the adjacent frames.
This commit is contained in:
parent e77865ce18
commit f91a604c6d
1 changed file with 95 additions and 56 deletions
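In the patch below, the forced-landmarks mode derives a default landmark set purely from the manual drag: the distance from the rectangle centre to the mouse position sets the scale, the angle sets the roll, and the generic LandmarksProcessor.landmarks_2D template is rotated, scaled and translated into place (see the hunk around line 547). A rough standalone sketch of that mapping, assuming a toy template; the function name and example values are illustrative and not part of DeepFaceLab:

import math

import cv2
import numpy as np

def place_template_landmarks(center_xy, edge_xy, template_2d):
    """Rotate/scale a generic landmark template to match a manually drawn face rectangle.

    center_xy   : (x, y) centre of the manual rectangle.
    edge_xy     : (x, y) mouse position; distance sets the scale, angle sets the roll.
    template_2d : (N, 2) float32 landmark template centred on the nose tip.
    """
    pt1 = np.float32(center_xy)
    pt2 = np.float32(edge_xy)
    vec = pt2 - pt1
    vec_len = float(np.linalg.norm(vec))
    if vec_len == 0:
        return None  # nothing to place yet
    vec /= vec_len

    # Rotate by the drag angle, scale by the drag length, translate to the rectangle centre.
    angle_deg = -np.arctan2(vec[1], vec[0]) * 180.0 / math.pi
    mat = cv2.getRotationMatrix2D((0, 0), angle_deg, vec_len)
    mat[:, 2] += center_xy

    # Apply the 2x3 affine transform to every template point.
    pts = np.expand_dims(template_2d, axis=1)        # (N, 1, 2), as cv2.transform expects
    return cv2.transform(pts, mat).squeeze(axis=1)   # back to (N, 2)

# Hypothetical 3-point template just to show the call; the real code concatenates 17 zero
# jaw points with LandmarksProcessor.landmarks_2D and re-centres on the nose tip (index 30).
template = np.float32([[0.0, 0.0], [-0.3, -0.3], [0.3, -0.3]])
print(place_template_landmarks((100.0, 120.0), (160.0, 120.0), template))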
@@ -10,6 +10,7 @@ from pathlib import Path
 
 import cv2
 import numpy as np
+from numpy import linalg as npla
 
 import facelib
 from core import imagelib
@@ -94,7 +95,7 @@ class ExtractSubprocessor(Subprocessor):
                 self.cached_image = ( filepath, image )
 
             h, w, c = image.shape
 
             dflimg = DFLIMG.load (filepath)
             extract_from_dflimg = (h == w and (dflimg is not None and dflimg.has_data()) )
 
@@ -302,16 +303,16 @@ class ExtractSubprocessor(Subprocessor):
         if not cpu_only:
             if type == 'landmarks-manual':
                 devices = [devices.get_best_device()]
 
             result = []
 
             for device in devices:
                 count = 1
 
                 if count == 1:
                     result += [ (device.index, 'GPU', device.name, device.total_mem_gb) ]
                 else:
                     for i in range(count):
                         result += [ (device.index, 'GPU', f"{device.name} #{i}", device.total_mem_gb) ]
 
             return result
@@ -358,6 +359,7 @@ class ExtractSubprocessor(Subprocessor):
         self.cache_text_lines_img = (None, None)
         self.hide_help = False
         self.landmarks_accurate = True
+        self.force_landmarks = False
 
         self.landmarks = None
         self.x = 0
@@ -397,7 +399,6 @@ class ExtractSubprocessor(Subprocessor):
     def get_data(self, host_dict):
         if self.type == 'landmarks-manual':
             need_remark_face = False
-            redraw_needed = False
             while len (self.input_data) > 0:
                 data = self.input_data[0]
                 filepath, data_rects, data_landmarks = data.filepath, data.rects, data.landmarks
@@ -410,11 +411,12 @@ class ExtractSubprocessor(Subprocessor):
                         self.landmarks = data_landmarks.pop()
                         data_rects.clear()
                         data_landmarks.clear()
-                        redraw_needed = True
+
                         self.rect_locked = True
                         self.rect_size = ( self.rect[2] - self.rect[0] ) / 2
                         self.x = ( self.rect[0] + self.rect[2] ) / 2
                         self.y = ( self.rect[1] + self.rect[3] ) / 2
+                        self.redraw()
 
                 if len(data_rects) == 0:
                     if self.cache_original_image[0] == filepath:
@@ -440,8 +442,8 @@ class ExtractSubprocessor(Subprocessor):
                         self.text_lines_img = self.cache_text_lines_img[1]
                     else:
                         self.text_lines_img = (imagelib.get_draw_text_lines ( self.image, sh,
-                                                [ '[Mouse click] - lock/unlock selection',
-                                                  '[Mouse wheel] - change rect',
+                                                [ '[L Mouse click] - lock/unlock selection. [Mouse wheel] - change rect',
+                                                  '[R Mouse Click] - manual face rectangle',
                                                   '[Enter] / [Space] - confirm / skip frame',
                                                   '[,] [.]- prev frame, next frame. [Q] - skip remaining frames',
                                                   '[a] - accuracy on/off (more fps)',
@@ -453,8 +455,10 @@ class ExtractSubprocessor(Subprocessor):
                 while True:
                     io.process_messages(0.0001)
 
-                    new_x = self.x
-                    new_y = self.y
+                    if not self.force_landmarks:
+                        new_x = self.x
+                        new_y = self.y
+
                     new_rect_size = self.rect_size
 
                     mouse_events = io.get_mouse_events(self.wnd_name)
@@ -465,8 +469,19 @@ class ExtractSubprocessor(Subprocessor):
                             diff = 1 if new_rect_size <= 40 else np.clip(new_rect_size / 10, 1, 10)
                             new_rect_size = max (5, new_rect_size + diff*mod)
                         elif ev == io.EVENT_LBUTTONDOWN:
-                            self.rect_locked = not self.rect_locked
-                            self.extract_needed = True
+                            if self.force_landmarks:
+                                self.x = new_x
+                                self.y = new_y
+                                self.force_landmarks = False
+                                self.rect_locked = True
+                                self.redraw()
+                            else:
+                                self.rect_locked = not self.rect_locked
+                                self.extract_needed = True
+                        elif ev == io.EVENT_RBUTTONDOWN:
+                            self.force_landmarks = not self.force_landmarks
+                            if self.force_landmarks:
+                                self.rect_locked = False
                         elif not self.rect_locked:
                             new_x = np.clip (x, 0, w-1) / self.view_scale
                             new_y = np.clip (y, 0, h-1) / self.view_scale
@@ -532,11 +547,35 @@ class ExtractSubprocessor(Subprocessor):
                             self.landmarks_accurate = not self.landmarks_accurate
                             break
 
-                    if self.x != new_x or \
+                    if self.force_landmarks:
+                        pt2 = np.float32([new_x, new_y])
+                        pt1 = np.float32([self.x, self.y])
+
+                        pt_vec_len = npla.norm(pt2-pt1)
+                        pt_vec = pt2-pt1
+                        if pt_vec_len != 0:
+                            pt_vec /= pt_vec_len
+
+                        self.rect_size = pt_vec_len
+                        self.rect = ( int(self.x-self.rect_size),
+                                      int(self.y-self.rect_size),
+                                      int(self.x+self.rect_size),
+                                      int(self.y+self.rect_size) )
+
+                        if pt_vec_len > 0:
+                            lmrks = np.concatenate ( (np.zeros ((17,2), np.float32), LandmarksProcessor.landmarks_2D), axis=0 )
+                            lmrks -= lmrks[30:31,:]
+                            mat = cv2.getRotationMatrix2D( (0, 0), -np.arctan2( pt_vec[1], pt_vec[0] )*180/math.pi , pt_vec_len)
+                            mat[:, 2] += (self.x, self.y)
+                            self.landmarks = LandmarksProcessor.transform_points(lmrks, mat )
+
+
+                        self.redraw()
+
+                    elif self.x != new_x or \
                        self.y != new_y or \
                        self.rect_size != new_rect_size or \
-                       self.extract_needed or \
-                       redraw_needed:
+                       self.extract_needed:
                         self.x = new_x
                         self.y = new_y
                         self.rect_size = new_rect_size
@@ -545,11 +584,7 @@ class ExtractSubprocessor(Subprocessor):
                                       int(self.x+self.rect_size),
                                       int(self.y+self.rect_size) )
 
-                        if redraw_needed:
-                            redraw_needed = False
-                            return ExtractSubprocessor.Data (filepath, landmarks_accurate=self.landmarks_accurate)
-                        else:
-                            return ExtractSubprocessor.Data (filepath, rects=[self.rect], landmarks_accurate=self.landmarks_accurate)
+                        return ExtractSubprocessor.Data (filepath, rects=[self.rect], landmarks_accurate=self.landmarks_accurate)
 
                 else:
                     is_frame_done = True
@@ -571,6 +606,40 @@ class ExtractSubprocessor(Subprocessor):
         if not self.type != 'landmarks-manual':
             self.input_data.insert(0, data)
 
+    def redraw(self):
+        (h,w,c) = self.image.shape
+
+        if not self.hide_help:
+            image = cv2.addWeighted (self.image,1.0,self.text_lines_img,1.0,0)
+        else:
+            image = self.image.copy()
+
+        view_rect = (np.array(self.rect) * self.view_scale).astype(np.int).tolist()
+        view_landmarks = (np.array(self.landmarks) * self.view_scale).astype(np.int).tolist()
+
+        if self.rect_size <= 40:
+            scaled_rect_size = h // 3 if w > h else w // 3
+
+            p1 = (self.x - self.rect_size, self.y - self.rect_size)
+            p2 = (self.x + self.rect_size, self.y - self.rect_size)
+            p3 = (self.x - self.rect_size, self.y + self.rect_size)
+
+            wh = h if h < w else w
+            np1 = (w / 2 - wh / 4, h / 2 - wh / 4)
+            np2 = (w / 2 + wh / 4, h / 2 - wh / 4)
+            np3 = (w / 2 - wh / 4, h / 2 + wh / 4)
+
+            mat = cv2.getAffineTransform( np.float32([p1,p2,p3])*self.view_scale, np.float32([np1,np2,np3]) )
+            image = cv2.warpAffine(image, mat,(w,h) )
+            view_landmarks = LandmarksProcessor.transform_points (view_landmarks, mat)
+
+        landmarks_color = (255,255,0) if self.rect_locked else (0,255,0)
+        LandmarksProcessor.draw_rect_landmarks (image, view_rect, view_landmarks, self.face_type, self.image_size, landmarks_color=landmarks_color)
+        self.extract_needed = False
+
+        io.show_image (self.wnd_name, image)
+
+
     #override
     def on_result (self, host_dict, data, result):
         if self.type == 'landmarks-manual':
@@ -579,37 +648,7 @@ class ExtractSubprocessor(Subprocessor):
             if len(landmarks) != 0 and landmarks[0] is not None:
                 self.landmarks = landmarks[0]
 
-            (h,w,c) = self.image.shape
-
-            if not self.hide_help:
-                image = cv2.addWeighted (self.image,1.0,self.text_lines_img,1.0,0)
-            else:
-                image = self.image.copy()
-
-            view_rect = (np.array(self.rect) * self.view_scale).astype(np.int).tolist()
-            view_landmarks = (np.array(self.landmarks) * self.view_scale).astype(np.int).tolist()
-
-            if self.rect_size <= 40:
-                scaled_rect_size = h // 3 if w > h else w // 3
-
-                p1 = (self.x - self.rect_size, self.y - self.rect_size)
-                p2 = (self.x + self.rect_size, self.y - self.rect_size)
-                p3 = (self.x - self.rect_size, self.y + self.rect_size)
-
-                wh = h if h < w else w
-                np1 = (w / 2 - wh / 4, h / 2 - wh / 4)
-                np2 = (w / 2 + wh / 4, h / 2 - wh / 4)
-                np3 = (w / 2 - wh / 4, h / 2 + wh / 4)
-
-                mat = cv2.getAffineTransform( np.float32([p1,p2,p3])*self.view_scale, np.float32([np1,np2,np3]) )
-                image = cv2.warpAffine(image, mat,(w,h) )
-                view_landmarks = LandmarksProcessor.transform_points (view_landmarks, mat)
-
-            landmarks_color = (255,255,0) if self.rect_locked else (0,255,0)
-            LandmarksProcessor.draw_rect_landmarks (image, view_rect, view_landmarks, self.face_type, self.image_size, landmarks_color=landmarks_color)
-            self.extract_needed = False
-
-            io.show_image (self.wnd_name, image)
+            self.redraw()
         else:
             self.result.append ( result )
             io.progress_bar_inc(1)
@@ -690,14 +729,14 @@ def main(detector=None,
          cpu_only = False,
          force_gpu_idxs = None,
          ):
 
     if not input_path.exists():
         io.log_err ('Input directory not found. Please ensure it exists.')
         return
 
     if face_type is not None:
         face_type = FaceType.fromString(face_type)
 
     if face_type is None:
         if manual_output_debug_fix and output_path.exists():
             files = pathex.get_image_paths(output_path)
@@ -705,14 +744,14 @@ def main(detector=None,
             dflimg = DFLIMG.load(Path(files[0]))
             if dflimg is not None and dflimg.has_data():
                 face_type = FaceType.fromString ( dflimg.get_face_type() )
 
     if face_type is None:
         face_type = io.input_str ("Face type", 'wf', ['f','wf','head'], help_message="Full face / whole face / head. 'Whole face' covers full area of face include forehead. 'head' covers full head, but requires XSeg for src and dst faceset.").lower()
         face_type = {'f'    : FaceType.FULL,
                      'wf'   : FaceType.WHOLE_FACE,
                      'head' : FaceType.HEAD}[face_type]
 
     image_size = 512 if face_type < FaceType.HEAD else 768
 
     if detector is None:
         io.log_info ("Choose detector type.")
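The new redraw() helper also magnifies the view when the selected rectangle is small (rect_size <= 40): three corners of the selection square are mapped onto a centred square of half the window's shorter side with cv2.getAffineTransform, and the frame plus landmarks are warped through the resulting matrix. A minimal sketch of that zoom step, assuming a plain BGR frame; the function name and example values are illustrative, not part of the patch:

import cv2
import numpy as np

def zoom_view_on_rect(image, cx, cy, rect_size, view_scale=1.0):
    """Warp the frame so a small selection square fills roughly half the window."""
    h, w = image.shape[:2]

    # Three corners of the selection square, in image coordinates.
    p1 = (cx - rect_size, cy - rect_size)
    p2 = (cx + rect_size, cy - rect_size)
    p3 = (cx - rect_size, cy + rect_size)

    # Matching corners of a centred square with side = min(w, h) / 2.
    wh = min(h, w)
    np1 = (w / 2 - wh / 4, h / 2 - wh / 4)
    np2 = (w / 2 + wh / 4, h / 2 - wh / 4)
    np3 = (w / 2 - wh / 4, h / 2 + wh / 4)

    mat = cv2.getAffineTransform(np.float32([p1, p2, p3]) * view_scale,
                                 np.float32([np1, np2, np3]))
    # The same matrix can be used to reproject the landmarks into view coordinates.
    return cv2.warpAffine(image, mat, (w, h)), mat

# Example: magnify a 30 px-wide selection at (300, 200) in a 720p frame.
frame = np.zeros((720, 1280, 3), np.uint8)
zoomed, mat = zoom_view_on_rect(frame, cx=300, cy=200, rect_size=15)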