Added interactive converter.

With interactive converter you can change any parameter of any frame and see the result in real time. Converter: added motion_blur_power param. Motion blur is applied by precomputed motion vectors. So the moving face will look more realistic. RecycleGAN model is removed. Added experimental AVATAR model. Minimum required VRAM is 6GB (NVIDIA), 12GB (AMD) Usage: 1) place data_src.mp4 10-20min square resolution video of news reporter sitting at the table with static background, other faces should not appear in frames. 2) process "extract images from video data_src.bat" with FULL fps 3) place data_dst.mp4 video of face who will control the src face 4) process "extract images from video data_dst FULL FPS.bat" 5) process "data_src mark faces S3FD best GPU.bat" 6) process "data_dst extract unaligned faces S3FD best GPU.bat" 7) train AVATAR.bat stage 1, tune batch size to maximum for your card (32 for 6GB), train to 50k+ iters. 8) train AVATAR.bat stage 2, tune batch size to maximum for your card (4 for 6GB), train to decent sharpness. 9) convert AVATAR.bat 10) converted to mp4.bat updated versions of modules
2025-07-06 04:52:13 -07:00 · 2019-08-24 12:57:29 +04:00 · 2019-08-24 12:57:29 +04:00 · 407ce3b1ca
commit 407ce3b1ca
parent 3f0bf2e994
46 changed files with 2394 additions and 1659 deletions
--- a/models/ModelBase.py
+++ b/models/ModelBase.py
@ -25,11 +25,11 @@ class ModelBase(object):

    def __init__(self, model_path, training_data_src_path=None, training_data_dst_path=None, pretraining_data_path=None, debug = False, device_args = None,
                 ask_enable_autobackup=True,
-                 ask_write_preview_history=True, 
-                 ask_target_iter=True, 
-                 ask_batch_size=True, 
+                 ask_write_preview_history=True,
+                 ask_target_iter=True,
+                 ask_batch_size=True,
                 ask_sort_by_yaw=True,
-                 ask_random_flip=True, 
+                 ask_random_flip=True,
                 ask_src_scale_mod=True):

        device_args['force_gpu_idx'] = device_args.get('force_gpu_idx',-1)
@ -55,7 +55,7 @@ class ModelBase(object):
        self.training_data_src_path = training_data_src_path
        self.training_data_dst_path = training_data_dst_path
        self.pretraining_data_path = pretraining_data_path
-        
+
        self.src_images_paths = None
        self.dst_images_paths = None
        self.src_yaw_images_paths = None
@ -106,7 +106,7 @@ class ModelBase(object):
            choose_preview_history = io.input_bool("Randomly choose new image for preview history? (y/n ?:help skip:%s) : " % (yn_str[False]), False, help_message="Preview image history will stay stuck with old faces if you reuse the same model on different celebs. Choose no unless you are changing src/dst to a new person")
        else:
            choose_preview_history = False
-        
+
        if ask_target_iter:
            if (self.iter == 0 or ask_override):
                self.options['target_iter'] = max(0, io.input_int("Target iteration (skip:unlimited/default) : ", 0))
@ -121,7 +121,7 @@ class ModelBase(object):
        else:
            self.options['batch_size'] = self.options.get('batch_size', 0)

-        if ask_sort_by_yaw:            
+        if ask_sort_by_yaw:
            if (self.iter == 0 or ask_override):
                default_sort_by_yaw = self.options.get('sort_by_yaw', False)
                self.options['sort_by_yaw'] = io.input_bool("Feed faces to network sorted by yaw? (y/n ?:help skip:%s) : " % (yn_str[default_sort_by_yaw]), default_sort_by_yaw, help_message="NN will not learn src face directions that don't match dst face directions. Do not use if the dst face has hair that covers the jaw." )
@ -139,7 +139,7 @@ class ModelBase(object):
                self.options['src_scale_mod'] = np.clip( io.input_int("Src face scale modifier % ( -30...30, ?:help skip:0) : ", 0, help_message="If src face shape is wider than dst, try to decrease this value to get a better result."), -30, 30)
            else:
                self.options['src_scale_mod'] = self.options.get('src_scale_mod', 0)
-                
+
        self.autobackup = self.options.get('autobackup', False)
        if not self.autobackup and 'autobackup' in self.options:
            self.options.pop('autobackup')
@ -180,10 +180,10 @@ class ModelBase(object):
            else:
                self.preview_history_path = self.model_path / ( '%d_%s_history' % (self.device_args['force_gpu_idx'], self.get_model_name()) )
                self.autobackups_path = self.model_path / ( '%d_%s_autobackups' % (self.device_args['force_gpu_idx'], self.get_model_name()) )
-                
+
            if self.autobackup:
                self.autobackup_current_hour = time.localtime().tm_hour
-                
+
                if not self.autobackups_path.exists():
                    self.autobackups_path.mkdir(exist_ok=True)

@ -202,7 +202,7 @@ class ModelBase(object):
                    if not isinstance(generator, SampleGeneratorBase):
                        raise ValueError('training data generator is not subclass of SampleGeneratorBase')

-            if self.sample_for_preview is None or choose_preview_history:                
+            if self.sample_for_preview is None or choose_preview_history:
                if choose_preview_history and io.is_support_windows():
                    wnd_name = "[p] - next. [enter] - confirm."
                    io.named_window(wnd_name)
@ -221,25 +221,25 @@ class ModelBase(object):
                                break
                            elif key == ord('p'):
                                break
-                                
+
                            try:
                                io.process_messages(0.1)
                            except KeyboardInterrupt:
                                choosed = True
-                                        
+
                    io.destroy_window(wnd_name)
-                else:    
-                    self.sample_for_preview = self.generate_next_sample()                    
+                else:
+                    self.sample_for_preview = self.generate_next_sample()
                self.last_sample = self.sample_for_preview
-                
+
        ###Generate text summary of model hyperparameters
        #Find the longest key name and value string. Used as column widths.
        width_name = max([len(k) for k in self.options.keys()] + [17]) + 1 # Single space buffer to left edge. Minimum of 17, the length of the longest static string used "Current iteration"
        width_value = max([len(str(x)) for x in self.options.values()] + [len(str(self.iter)), len(self.get_model_name())]) + 1 # Single space buffer to right edge
        if not self.device_config.cpu_only: #Check length of GPU names
-            width_value = max([len(nnlib.device.getDeviceName(idx))+1 for idx in self.device_config.gpu_idxs] + [width_value]) 
+            width_value = max([len(nnlib.device.getDeviceName(idx))+1 for idx in self.device_config.gpu_idxs] + [width_value])
        width_total = width_name + width_value + 2 #Plus 2 for ": "
-        
+
        model_summary_text = []
        model_summary_text += [f'=={" Model Summary ":=^{width_total}}=='] # Model/status summary
        model_summary_text += [f'=={" "*width_total}==']
@ -247,13 +247,13 @@ class ModelBase(object):
        model_summary_text += [f'=={" "*width_total}==']
        model_summary_text += [f'=={"Current iteration": >{width_name}}: {str(self.iter): <{width_value}}=='] # Iter
        model_summary_text += [f'=={" "*width_total}==']
-        
+
        model_summary_text += [f'=={" Model Options ":-^{width_total}}=='] # Model options
        model_summary_text += [f'=={" "*width_total}==']
        for key in self.options.keys():
            model_summary_text += [f'=={key: >{width_name}}: {str(self.options[key]): <{width_value}}=='] # self.options key/value pairs
        model_summary_text += [f'=={" "*width_total}==']
-        
+
        model_summary_text += [f'=={" Running On ":-^{width_total}}=='] # Training hardware info
        model_summary_text += [f'=={" "*width_total}==']
        if self.device_config.multi_gpu:
@ -266,10 +266,10 @@ class ModelBase(object):
                model_summary_text += [f'=={"Device index": >{width_name}}: {idx: <{width_value}}=='] # GPU hardware device index
                model_summary_text += [f'=={"Name": >{width_name}}: {nnlib.device.getDeviceName(idx): <{width_value}}=='] # GPU name
                vram_str = f'{nnlib.device.getDeviceVRAMTotalGb(idx):.2f}GB' # GPU VRAM - Formated as #.## (or ##.##)
-                model_summary_text += [f'=={"VRAM": >{width_name}}: {vram_str: <{width_value}}=='] 
+                model_summary_text += [f'=={"VRAM": >{width_name}}: {vram_str: <{width_value}}==']
        model_summary_text += [f'=={" "*width_total}==']
        model_summary_text += [f'=={"="*width_total}==']
-        
+
        if not self.device_config.cpu_only and self.device_config.gpu_vram_gb[0] <= 2: # Low VRAM warning
            model_summary_text += ["/!\\"]
            model_summary_text += ["/!\\ WARNING:"]
@ -277,7 +277,7 @@ class ModelBase(object):
            model_summary_text += ["/!\\ If training does not start, close all programs and try again."]
            model_summary_text += ["/!\\ Also you can disable Windows Aero Desktop to increase available VRAM."]
            model_summary_text += ["/!\\"]
- 
+
        model_summary_text = "\n".join (model_summary_text)
        self.model_summary_text = model_summary_text
        io.log_info(model_summary_text)
@ -323,6 +323,11 @@ class ModelBase(object):
    def get_model_filename_list(self):
        return []

+    #overridable
+    def get_ConverterConfig(self):
+        #return ConverterConfig() for the model
+        raise NotImplementedError
+
    #overridable
    def get_converter(self):
        raise NotImplementedError
@ -372,9 +377,9 @@ class ModelBase(object):
        }
        self.model_data_path.write_bytes( pickle.dumps(model_data) )

-        bckp_filename_list = [ self.get_strpath_storage_for_file(filename) for _, filename in self.get_model_filename_list() ]        
-        bckp_filename_list += [ str(summary_path), str(self.model_data_path) ] 
-        
+        bckp_filename_list = [ self.get_strpath_storage_for_file(filename) for _, filename in self.get_model_filename_list() ]
+        bckp_filename_list += [ str(summary_path), str(self.model_data_path) ]
+
        if self.autobackup:
            current_hour = time.localtime().tm_hour
            if self.autobackup_current_hour != current_hour:
@ -383,20 +388,20 @@ class ModelBase(object):
                for i in range(15,0,-1):
                    idx_str = '%.2d' % i
                    next_idx_str = '%.2d' % (i+1)
-                    
+
                    idx_backup_path = self.autobackups_path / idx_str
                    next_idx_packup_path = self.autobackups_path / next_idx_str
-                    
+
                    if idx_backup_path.exists():
-                        if i == 15: 
+                        if i == 15:
                            Path_utils.delete_all_files(idx_backup_path)
                        else:
                            next_idx_packup_path.mkdir(exist_ok=True)
                            Path_utils.move_all_files (idx_backup_path, next_idx_packup_path)
-                            
+
                    if i == 1:
-                        idx_backup_path.mkdir(exist_ok=True)                    
-                        for filename in bckp_filename_list:                   
+                        idx_backup_path.mkdir(exist_ok=True)
+                        for filename in bckp_filename_list:
                            shutil.copy ( str(filename), str(idx_backup_path / Path(filename).name) )

                        previews = self.get_previews()
@ -440,7 +445,7 @@ class ModelBase(object):
            model.save_weights( filename + '.tmp' )

        rename_list = model_filename_list
-        
+
        """
        #unused
        , optimizer_filename_list=[]
@ -464,7 +469,7 @@ class ModelBase(object):
            except Exception as e:
                print ("Unable to save ", opt_filename)
        """
-        
+
        for _, filename in rename_list:
            filename = self.get_strpath_storage_for_file(filename)
            source_filename = Path(filename+'.tmp')
@ -473,7 +478,7 @@ class ModelBase(object):
                if target_filename.exists():
                    target_filename.unlink()
                source_filename.rename ( str(target_filename) )
-                
+
    def debug_one_iter(self):
        images = []
        for generator in self.generator_list:
@ -579,8 +584,8 @@ class ModelBase(object):

        lh_height = 100
        lh_img = np.ones ( (lh_height,w,c) ) * 0.1
-        
-        if len(loss_history) != 0:        
+
+        if len(loss_history) != 0:
            loss_count = len(loss_history[0])
            lh_len = len(loss_history)