global refactoring and fixes,

removed support of extracted(aligned) PNG faces. Use old builds to convert from PNG to JPG. fanseg model file in facelib/ is renamed
2025-07-06 04:52:13 -07:00 · 2020-03-13 08:09:00 +04:00 · 2020-03-13 08:09:00 +04:00 · 61472cdaf7
commit 61472cdaf7
parent 921b464d5b
82 changed files with 3838 additions and 3812 deletions
--- a/models/Model_XSeg/Model.py
+++ b/models/Model_XSeg/Model.py
@ -1,180 +0,0 @@
-import multiprocessing
-import operator
-from functools import partial
-
-import numpy as np
-
-from core import mathlib
-from core.interact import interact as io
-from core.leras import nn
-from facelib import FaceType, TernausNet
-from models import ModelBase
-from samplelib import *
-
-class XSegModel(ModelBase):
-
-    #override
-    def on_initialize_options(self):
-        device_config = nn.getCurrentDeviceConfig()
-        yn_str = {True:'y',False:'n'}
-
-        #default_resolution = 256
-  
-        ask_override = self.ask_override()
-        if self.is_first_run() or ask_override:
-            self.ask_autobackup_hour()
-            self.ask_target_iter()
-            self.ask_batch_size(24)
-
-        #if self.is_first_run():
-        #resolution = io.input_int("Resolution", default_resolution, add_info="64-512")
-        #resolution = np.clip ( (resolution // 16) * 16, 64, 512)
-        #self.options['resolution'] = resolution
-
-    #override
-    def on_initialize(self):
-        device_config = nn.getCurrentDeviceConfig()
-        self.model_data_format = "NCHW" if len(device_config.devices) != 0 and not self.is_debug() else "NHWC"
-        nn.initialize(data_format=self.model_data_format)
-        tf = nn.tf
-
-        device_config = nn.getCurrentDeviceConfig()
-        devices = device_config.devices
-
-        self.resolution = resolution = 256#self.options['resolution']
-
-        place_model_on_cpu = True#len(devices) == 0
-        models_opt_device = '/CPU:0' if place_model_on_cpu else '/GPU:0'
-
-        bgr_shape = nn.get4Dshape(resolution,resolution,3)
-        mask_shape = nn.get4Dshape(resolution,resolution,1)
- 
-        # Initializing model classes
-        self.model = TernausNet(f'{self.model_name}_SkinSeg', 
-                                 resolution, 
-                                 load_weights=not self.is_first_run(),
-                                 weights_file_root=self.get_model_root_path(),
-                                 training=True,
-                                 place_model_on_cpu=place_model_on_cpu,
-                                 data_format=nn.data_format)
-                                 
-        if self.is_training:
-            # Adjust batch size for multiple GPU
-            gpu_count = max(1, len(devices) )
-            bs_per_gpu = max(1, self.get_batch_size() // gpu_count)
-            self.set_batch_size( gpu_count*bs_per_gpu)
-
-
-            # Compute losses per GPU
-            gpu_pred_list = []
-
-            gpu_losses = []
-            gpu_loss_gvs = []
-            
-            for gpu_id in range(gpu_count):
-                with tf.device( f'/GPU:{gpu_id}' if len(devices) != 0 else f'/CPU:0' ):
-
-                    with tf.device(f'/CPU:0'):
-                        # slice on CPU, otherwise all batch data will be transfered to GPU first
-                        batch_slice = slice( gpu_id*bs_per_gpu, (gpu_id+1)*bs_per_gpu )
-                        gpu_input_t       = self.model.input_t [batch_slice,:,:,:]
-                        gpu_target_t      = self.model.target_t [batch_slice,:,:,:]                        
-                        
-                    # process model tensors
-                    gpu_pred_logits_t, gpu_pred_t = self.model.net([gpu_input_t])                    
-                    gpu_pred_list.append(gpu_pred_t)
- 
-                    gpu_loss = tf.reduce_mean( tf.nn.sigmoid_cross_entropy_with_logits(labels=gpu_target_t, logits=gpu_pred_logits_t), axis=[1,2,3])
-                    gpu_losses += [gpu_loss]
-
-                    gpu_loss_gvs += [ nn.tf_gradients ( gpu_loss, self.model.net_weights ) ]
-
-
-            # Average losses and gradients, and create optimizer update ops
-            with tf.device (models_opt_device):
-                pred = nn.tf_concat(gpu_pred_list, 0)                
-                loss = tf.reduce_mean(gpu_losses)
-                
-                loss_gv_op = self.model.opt.get_update_op (nn.tf_average_gv_list (gpu_loss_gvs))
-  
-        
-            # Initializing training and view functions
-            def train(input_np, target_np):
-                l, _ = nn.tf_sess.run ( [loss, loss_gv_op], feed_dict={self.model.input_t :input_np, self.model.target_t :target_np })
-                return l
-            self.train = train
-
-            def view(input_np):
-                return nn.tf_sess.run ( [pred], feed_dict={self.model.input_t :input_np})
-            self.view = view
-
-            # initializing sample generators
-            cpu_count = min(multiprocessing.cpu_count(), 8)
-            src_generators_count = cpu_count // 2
-            dst_generators_count = cpu_count // 2
-            src_generators_count = int(src_generators_count * 1.5)
-            
-            
-            src_generator = SampleGeneratorFaceCelebAMaskHQ ( root_path=self.training_data_src_path, debug=self.is_debug(), batch_size=self.get_batch_size(), resolution=256, generators_count=src_generators_count, data_format = nn.data_format)
-            
-            dst_generator = SampleGeneratorImage(self.training_data_dst_path, debug=self.is_debug(), batch_size=self.get_batch_size(),
-                                                sample_process_options=SampleProcessor.Options(random_flip=True),
-                                                output_sample_types = [ {'sample_type': SampleProcessor.SampleType.IMAGE,  'warp':False, 'transform':True, 'channel_type' : SampleProcessor.ChannelType.BGR, 'data_format':nn.data_format, 'resolution': resolution} ],
-                                                generators_count=dst_generators_count,
-                                                raise_on_no_data=False )
-            if not dst_generator.is_initialized():
-                io.log_info(f"\nTo view the model on unseen faces, place any image faces in {self.training_data_dst_path}.\n")
-                
-            self.set_training_data_generators ([src_generator, dst_generator])
-
-    #override
-    def get_model_filename_list(self):
-        return self.model.model_filename_list
-
-    #override
-    def onSave(self):
-        self.model.save_weights()
-        
-    #override
-    def onTrainOneIter(self):        
-        image_np, mask_np = self.generate_next_samples()[0]
-        loss = self.train (image_np, mask_np)       
-
-        return ( ('loss', loss ), )
-
-    #override
-    def onGetPreview(self, samples):
-        n_samples = min(4, self.get_batch_size(), 800 // self.resolution )
-
-        src_samples, dst_samples = samples        
-        image_np, mask_np = src_samples
-
-        I, M, IM, = [ np.clip( nn.to_data_format(x,"NHWC", self.model_data_format), 0.0, 1.0) for x in ([image_np,mask_np] + self.view (image_np) ) ]
-        M, IM, = [ np.repeat (x, (3,), -1) for x in [M, IM] ]
-
-        green_bg = np.tile( np.array([0,1,0], dtype=np.float32)[None,None,...], (self.resolution,self.resolution,1) )
-
-        result = []        
-        st = []
-        for i in range(n_samples):
-            ar = I[i]*M[i]+ green_bg*(1-M[i]), IM[i], I[i]*IM[i] + green_bg*(1-IM[i])
-            st.append ( np.concatenate ( ar, axis=1) )
-        result += [ ('XSeg training faces', np.concatenate (st, axis=0 )), ]
-        
-        if len(dst_samples) != 0:
-            dst_np, = dst_samples
-            
-
-            D, DM, = [ np.clip(nn.to_data_format(x,"NHWC", self.model_data_format), 0.0, 1.0) for x in ([dst_np] + self.view (dst_np) ) ]
-            DM, = [ np.repeat (x, (3,), -1) for x in [DM] ]
-        
-            st = []
-            for i in range(n_samples):
-                ar = D[i], DM[i], D[i]*DM[i]+ green_bg*(1-DM[i])
-                st.append ( np.concatenate ( ar, axis=1) )
-            
-            result += [ ('XSeg unseen faces', np.concatenate (st, axis=0 )), ]
-            
-        return result
-
-Model = XSegModel