Mirror of https://github.com/iperov/DeepFaceLab.git (synced 2025-07-06 04:52:13 -07:00)

Commit 143792fd31 (parent 3b6ad4abf9): added fanseg for future WF segmentation model
6 changed files with 429 additions and 112 deletions
@@ -9,6 +9,7 @@ def initialize_models(nn):
         def __init__(self, *args, name=None, **kwargs):
             super().__init__(name=name)
             self.layers = []
+            self.layers_by_name = {}
             self.built = False
             self.args = args
             self.kwargs = kwargs
@@ -31,7 +32,8 @@ def initialize_models(nn):
                     layer.build()

                 self.layers.append (layer)
+                self.layers_by_name[layer.name] = layer

         def xor_list(self, lst1, lst2):
             return [value for value in lst1+lst2 if (value not in lst1) or (value not in lst2) ]

@@ -76,6 +78,9 @@ def initialize_models(nn):
                 weights += layer.get_weights()
             return weights

+        def get_layer_by_name(self, name):
+            return self.layers_by_name.get(name, None)
+
         def get_layers(self):
             if not self.built:
                 self.build()
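The three hunks above give leras models a name-keyed registry next to the ordered self.layers list, so a layer can be fetched in O(1) by the name it was built with. The TernausNet change further down depends on this: it copies pretrained VGG11 tensors into individual encoder layers via model.get_layer_by_name('features_%d' % i). A minimal self-contained sketch of the pattern (simplified, hypothetical classes; not the actual leras API):

    # Sketch: an ordered layer list plus a name->layer index (hypothetical classes).
    class Layer:
        def __init__(self, name):
            self.name = name
            self.weights = None

        def set_weights(self, w):
            self.weights = w

    class Model:
        def __init__(self):
            self.layers = []          # preserves build order
            self.layers_by_name = {}  # O(1) lookup by name

        def add(self, layer):
            self.layers.append(layer)
            self.layers_by_name[layer.name] = layer

        def get_layer_by_name(self, name):
            return self.layers_by_name.get(name, None)

    m = Model()
    for i in [0, 3, 6]:
        m.add(Layer('features_%d' % i))

    # e.g. assigning pretrained tensors by name, as the VGG11 loader does:
    m.get_layer_by_name('features_3').set_weights([1.0, 2.0])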
@@ -24,44 +24,44 @@ class TernausNet(object):
         tf = nn.tf

         class Ternaus(nn.ModelBase):
-            def on_build(self, in_ch, ch):
+            def on_build(self, in_ch, base_ch):

-                self.features_0 = nn.Conv2D (in_ch, ch, kernel_size=3, padding='SAME')
+                self.features_0 = nn.Conv2D (in_ch, base_ch, kernel_size=3, padding='SAME')
                 self.blurpool_0 = nn.BlurPool (filt_size=3)

-                self.features_3 = nn.Conv2D (ch, ch*2, kernel_size=3, padding='SAME')
+                self.features_3 = nn.Conv2D (base_ch, base_ch*2, kernel_size=3, padding='SAME')
                 self.blurpool_3 = nn.BlurPool (filt_size=3)

-                self.features_6 = nn.Conv2D (ch*2, ch*4, kernel_size=3, padding='SAME')
-                self.features_8 = nn.Conv2D (ch*4, ch*4, kernel_size=3, padding='SAME')
+                self.features_6 = nn.Conv2D (base_ch*2, base_ch*4, kernel_size=3, padding='SAME')
+                self.features_8 = nn.Conv2D (base_ch*4, base_ch*4, kernel_size=3, padding='SAME')
                 self.blurpool_8 = nn.BlurPool (filt_size=3)

-                self.features_11 = nn.Conv2D (ch*4, ch*8, kernel_size=3, padding='SAME')
-                self.features_13 = nn.Conv2D (ch*8, ch*8, kernel_size=3, padding='SAME')
+                self.features_11 = nn.Conv2D (base_ch*4, base_ch*8, kernel_size=3, padding='SAME')
+                self.features_13 = nn.Conv2D (base_ch*8, base_ch*8, kernel_size=3, padding='SAME')
                 self.blurpool_13 = nn.BlurPool (filt_size=3)

-                self.features_16 = nn.Conv2D (ch*8, ch*8, kernel_size=3, padding='SAME')
-                self.features_18 = nn.Conv2D (ch*8, ch*8, kernel_size=3, padding='SAME')
+                self.features_16 = nn.Conv2D (base_ch*8, base_ch*8, kernel_size=3, padding='SAME')
+                self.features_18 = nn.Conv2D (base_ch*8, base_ch*8, kernel_size=3, padding='SAME')
                 self.blurpool_18 = nn.BlurPool (filt_size=3)

-                self.conv_center = nn.Conv2D (ch*8, ch*8, kernel_size=3, padding='SAME')
+                self.conv_center = nn.Conv2D (base_ch*8, base_ch*8, kernel_size=3, padding='SAME')

-                self.conv1_up = nn.Conv2DTranspose (ch*8, ch*4, kernel_size=3, padding='SAME')
-                self.conv1 = nn.Conv2D (ch*12, ch*8, kernel_size=3, padding='SAME')
+                self.conv1_up = nn.Conv2DTranspose (base_ch*8, base_ch*4, kernel_size=3, padding='SAME')
+                self.conv1 = nn.Conv2D (base_ch*12, base_ch*8, kernel_size=3, padding='SAME')

-                self.conv2_up = nn.Conv2DTranspose (ch*8, ch*4, kernel_size=3, padding='SAME')
-                self.conv2 = nn.Conv2D (ch*12, ch*8, kernel_size=3, padding='SAME')
+                self.conv2_up = nn.Conv2DTranspose (base_ch*8, base_ch*4, kernel_size=3, padding='SAME')
+                self.conv2 = nn.Conv2D (base_ch*12, base_ch*8, kernel_size=3, padding='SAME')

-                self.conv3_up = nn.Conv2DTranspose (ch*8, ch*2, kernel_size=3, padding='SAME')
-                self.conv3 = nn.Conv2D (ch*6, ch*4, kernel_size=3, padding='SAME')
+                self.conv3_up = nn.Conv2DTranspose (base_ch*8, base_ch*2, kernel_size=3, padding='SAME')
+                self.conv3 = nn.Conv2D (base_ch*6, base_ch*4, kernel_size=3, padding='SAME')

-                self.conv4_up = nn.Conv2DTranspose (ch*4, ch, kernel_size=3, padding='SAME')
-                self.conv4 = nn.Conv2D (ch*3, ch*2, kernel_size=3, padding='SAME')
+                self.conv4_up = nn.Conv2DTranspose (base_ch*4, base_ch, kernel_size=3, padding='SAME')
+                self.conv4 = nn.Conv2D (base_ch*3, base_ch*2, kernel_size=3, padding='SAME')

-                self.conv5_up = nn.Conv2DTranspose (ch*2, ch//2, kernel_size=3, padding='SAME')
-                self.conv5 = nn.Conv2D (ch//2+ch, ch, kernel_size=3, padding='SAME')
+                self.conv5_up = nn.Conv2DTranspose (base_ch*2, base_ch//2, kernel_size=3, padding='SAME')
+                self.conv5 = nn.Conv2D (base_ch//2+base_ch, base_ch, kernel_size=3, padding='SAME')

-                self.out_conv = nn.Conv2D (ch, 1, kernel_size=3, padding='SAME')
+                self.out_conv = nn.Conv2D (base_ch, 1, kernel_size=3, padding='SAME')

             def forward(self, inp):
                 x, = inp
@@ -106,92 +106,120 @@ class TernausNet(object):
                 x = tf.concat( [x,x0], -1)
                 x = tf.nn.relu(self.conv5(x))

-                x = tf.nn.sigmoid(self.out_conv(x))
-                return x
+                logits = self.out_conv(x)
+                return logits, tf.nn.sigmoid(logits)

         if weights_file_root is not None:
             weights_file_root = Path(weights_file_root)
         else:
             weights_file_root = Path(__file__).parent
-        self.weights_path = weights_file_root / ('%s_%d_%s.npy' % (name, resolution, face_type_str) )
+        self.weights_file_root = weights_file_root

-        e = tf.device('/CPU:0') if place_model_on_cpu else None
+        with tf.device ('/CPU:0'):
+            #Place holders on CPU
+            self.input_t  = tf.placeholder (nn.tf_floatx, nn.get4Dshape(resolution,resolution,3) )
+            self.target_t = tf.placeholder (nn.tf_floatx, nn.get4Dshape(resolution,resolution,1) )

-        if e is not None: e.__enter__()
-        self.net = Ternaus(3, 64, name='Ternaus')
-        if load_weights:
-            self.net.load_weights (self.weights_path)
-        else:
-            self.net.init_weights()
-        if e is not None: e.__exit__(None,None,None)
-
-        self.net.build_for_run ( [(tf.float32, nn.get4Dshape (resolution,resolution,3) )] )
-
-        if training:
-            raise Exception("training not supported yet")
+        # Initializing model classes
+        with tf.device ('/CPU:0' if place_model_on_cpu else '/GPU:0'):
+            self.net = Ternaus(3, 64, name='Ternaus')
+            self.net_weights = self.net.get_weights()
+
+        self.model_filename_list = [ [self.net, '%s_%d_%s.npy' % (name, resolution, face_type_str) ] ]
+
+        if training:
+            self.opt = nn.TFRMSpropOptimizer(lr=0.0001, name='opt')
+            self.opt.initialize_variables (self.net_weights, vars_on_cpu=place_model_on_cpu)
+            self.model_filename_list += [ [self.opt, '%s_%d_%s_opt.npy' % (name, resolution, face_type_str) ] ]
+        else:
+            _, pred = self.net([self.input_t])
+
+            def net_run(input_np):
+                return nn.tf_sess.run ( [pred], feed_dict={self.input_t :input_np})[0]
+            self.net_run = net_run
+
+        # Loading/initializing all models/optimizers weights
+        for model, filename in io.progress_bar_generator(self.model_filename_list, "Initializing models"):
+            do_init = not load_weights
+
+            if not do_init:
+                do_init = not model.load_weights( self.weights_file_root / filename )
+
+            if do_init:
+                model.init_weights()
+                if model == self.net:
+                    try:
+                        with open( Path(__file__).parent / 'vgg11_enc_weights.npy', 'rb' ) as f:
+                            d = pickle.loads (f.read())
+
+                        for i in [0,3,6,8,11,13,16,18]:
+                            model.get_layer_by_name ('features_%d' % i).set_weights ( d['features.%d' % i] )
+                    except:
+                        io.log_err("Unable to load VGG11 pretrained weights from vgg11_enc_weights.npy")

-        """
-        if training:
-            try:
-                with open( Path(__file__).parent / 'vgg11_enc_weights.npy', 'rb' ) as f:
-                    d = pickle.loads (f.read())
-
-                for i in [0,3,6,8,11,13,16,18]:
-                    s = 'features.%d' % i
-
-                    self.model.get_layer (s).set_weights ( d[s] )
-            except:
-                io.log_err("Unable to load VGG11 pretrained weights from vgg11_enc_weights.npy")
-
-        conv_weights_list = []
-        for layer in self.model.layers:
-            if 'CA.' in layer.name:
-                conv_weights_list += [layer.weights[0]] #Conv2D kernel_weights
-        CAInitializerMP ( conv_weights_list )
-        """
-
-        """
-        if training:
-            inp_t = Input ( (resolution, resolution, 3) )
-            real_t = Input ( (resolution, resolution, 1) )
-            out_t = self.model(inp_t)
-
-            loss = K.mean(10*K.binary_crossentropy(real_t,out_t) )
-
-            out_t_diff1 = out_t[:, 1:, :, :] - out_t[:, :-1, :, :]
-            out_t_diff2 = out_t[:, :, 1:, :] - out_t[:, :, :-1, :]
-
-            total_var_loss = K.mean( 0.1*K.abs(out_t_diff1), axis=[1, 2, 3] ) + K.mean( 0.1*K.abs(out_t_diff2), axis=[1, 2, 3] )
-
-            opt = Adam(lr=0.0001, beta_1=0.5, beta_2=0.999, tf_cpu_mode=2)
-
-            self.train_func = K.function ( [inp_t, real_t], [K.mean(loss)], opt.get_updates( [loss], self.model.trainable_weights) )
-        """
-
-    def __enter__(self):
-        return self
-
-    def __exit__(self, exc_type=None, exc_value=None, traceback=None):
-        return False #pass exception between __enter__ and __exit__ to outter level

     def save_weights(self):
-        self.net.save_weights (str(self.weights_path))
-
-    def train(self, inp, real):
-        loss, = self.train_func ([inp, real])
-        return loss
+        for model, filename in io.progress_bar_generator(self.model_filename_list, "Saving"):
+            model.save_weights( self.weights_file_root / filename )

     def extract (self, input_image):
         input_shape_len = len(input_image.shape)
         if input_shape_len == 3:
-            input_image = input_image[np.newaxis,...]
+            input_image = input_image[None,...]

-        result = np.clip ( self.net.run([input_image]), 0, 1.0 )
+        result = np.clip ( self.net_run(input_image), 0, 1.0 )
         result[result < 0.1] = 0 #get rid of noise

         if input_shape_len == 3:
             result = result[0]

         return result
+
+    """
+    if load_weights:
+        self.net.load_weights (self.weights_path)
+    else:
+        self.net.init_weights()
+
+    if load_weights:
+        self.opt.load_weights (self.opt_path)
+    else:
+        self.opt.init_weights()
+    """
+
+    """
+    if training:
+        try:
+            with open( Path(__file__).parent / 'vgg11_enc_weights.npy', 'rb' ) as f:
+                d = pickle.loads (f.read())
+
+            for i in [0,3,6,8,11,13,16,18]:
+                s = 'features.%d' % i
+
+                self.model.get_layer (s).set_weights ( d[s] )
+        except:
+            io.log_err("Unable to load VGG11 pretrained weights from vgg11_enc_weights.npy")
+
+        conv_weights_list = []
+        for layer in self.model.layers:
+            if 'CA.' in layer.name:
+                conv_weights_list += [layer.weights[0]] #Conv2D kernel_weights
+        CAInitializerMP ( conv_weights_list )
+    """
+
+    """
+    if training:
+        inp_t = Input ( (resolution, resolution, 3) )
+        real_t = Input ( (resolution, resolution, 1) )
+        out_t = self.model(inp_t)
+
+        loss = K.mean(10*K.binary_crossentropy(real_t,out_t) )
+
+        out_t_diff1 = out_t[:, 1:, :, :] - out_t[:, :-1, :, :]
+        out_t_diff2 = out_t[:, :, 1:, :] - out_t[:, :, :-1, :]
+
+        total_var_loss = K.mean( 0.1*K.abs(out_t_diff1), axis=[1, 2, 3] ) + K.mean( 0.1*K.abs(out_t_diff2), axis=[1, 2, 3] )
+
+        opt = Adam(lr=0.0001, beta_1=0.5, beta_2=0.999, tf_cpu_mode=2)
+
+        self.train_func = K.function ( [inp_t, real_t], [K.mean(loss)], opt.get_updates( [loss], self.model.trainable_weights) )
+    """
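Returning the raw logits alongside the sigmoid activation is what makes the new trainable path work: the FANSeg model below feeds the logits to tf.nn.sigmoid_cross_entropy_with_logits, which is numerically stabler than taking a log of an explicit sigmoid, while extract() keeps consuming the [0,1] mask. A minimal TF1-style sketch of the pairing (standalone code assuming tensorflow.compat.v1; the shapes and conv layer are illustrative stand-ins, not the Ternaus network):

    # Sketch: pair a logits output with sigmoid_cross_entropy_with_logits (TF1 API).
    import numpy as np
    import tensorflow.compat.v1 as tf
    tf.disable_v2_behavior()

    x      = tf.placeholder(tf.float32, (None, 8, 8, 1))   # illustrative input
    target = tf.placeholder(tf.float32, (None, 8, 8, 1))   # binary mask

    logits = tf.layers.conv2d(x, 1, 3, padding='same')     # stand-in for out_conv
    pred   = tf.nn.sigmoid(logits)                         # used at inference time

    # loss is computed from the logits, not from pred, for numerical stability
    loss = tf.reduce_mean(
        tf.nn.sigmoid_cross_entropy_with_logits(labels=target, logits=logits),
        axis=[1, 2, 3])

    with tf.Session() as sess:
        sess.run(tf.global_variables_initializer())
        l = sess.run(loss, feed_dict={x:      np.zeros((2, 8, 8, 1), np.float32),
                                      target: np.zeros((2, 8, 8, 1), np.float32)})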
@@ -1,3 +1,4 @@
+import json
 import multiprocessing
 import shutil
 from pathlib import Path
@@ -5,12 +6,14 @@ from pathlib import Path
 import cv2
 import numpy as np

-from DFLIMG import *
-from facelib import FaceType, LandmarksProcessor
+from core import imagelib, pathex
+from core.cv2ex import *
+from core.imagelib import IEPolys
 from core.interact import interact as io
 from core.joblib import Subprocessor
-from core import pathex, imagelib
-from core.cv2ex import *
+from core.leras import nn
+from DFLIMG import *
+from facelib import FaceType, LandmarksProcessor

 from . import Extractor, Sorter
 from .Extractor import ExtractSubprocessor
@@ -393,7 +396,8 @@ def extract_fanseg(input_dir, device_args={} ):
     data = ExtractSubprocessor ([ ExtractSubprocessor.Data(filename) for filename in paths_to_extract ], 'fanseg', multi_gpu=multi_gpu, cpu_only=cpu_only).run()

 #unused in end user workflow
-def dev_test(input_dir ):
+def dev_test_68(input_dir ):
+    # process 68 landmarks dataset with .pts files
     input_path = Path(input_dir)
     if not input_path.exists():
         raise ValueError('input_dir not found. Please ensure it exists.')
@@ -441,7 +445,7 @@ def dev_test(input_dir ):
             continue

         rect = LandmarksProcessor.get_rect_from_landmarks(lmrks)

         output_filepath = output_path / (filepath.stem+'.jpg')

         img = cv2_imread(filepath)
@@ -549,3 +553,108 @@ def dev_test1(input_dir):
     #import code
     #code.interact(local=dict(globals(), **locals()))

+#unused in end user workflow
+def dev_test(input_dir ):
+    # extract and merge .json labelme files within the faces
+
+    device_config = nn.DeviceConfig.GPUIndexes( nn.ask_choose_device_idxs(suggest_all_gpu=True) )
+
+    input_path = Path(input_dir)
+    if not input_path.exists():
+        raise ValueError('input_dir not found. Please ensure it exists.')
+
+    output_path = input_path.parent / (input_path.name+'_merged')
+
+    io.log_info(f'Output dir is {output_path}')
+
+    if output_path.exists():
+        output_images_paths = pathex.get_image_paths(output_path)
+        if len(output_images_paths) > 0:
+            io.input_bool("WARNING !!! \n %s contains files! \n They will be deleted. \n Press enter to continue." % (str(output_path)), False )
+            for filename in output_images_paths:
+                Path(filename).unlink()
+    else:
+        output_path.mkdir(parents=True, exist_ok=True)
+
+    images_paths = pathex.get_image_paths(input_path)
+
+    extract_data = []
+    images_jsons = {}
+
+    for filepath in io.progress_bar_generator(images_paths, "Processing"):
+        filepath = Path(filepath)
+
+        json_filepath = filepath.parent / (filepath.stem+'.json')
+
+        if json_filepath.exists():
+            json_dict = json.loads(json_filepath.read_text())
+            images_jsons[filepath] = json_dict
+
+            total_points = [ [x,y] for shape in json_dict['shapes'] for x,y in shape['points'] ]
+            total_points = np.array(total_points)
+
+            l,r = int(total_points[:,0].min()), int(total_points[:,0].max())
+            t,b = int(total_points[:,1].min()), int(total_points[:,1].max())
+
+            extract_data.append ( ExtractSubprocessor.Data(filepath, rects=[ [l,t,r,b] ] ) )
+
+    image_size = 1024
+    face_type = FaceType.HEAD
+    extract_data = ExtractSubprocessor (extract_data, 'landmarks', image_size, face_type, device_config=device_config).run()
+    extract_data = ExtractSubprocessor (extract_data, 'final', image_size, face_type, final_output_path=output_path, device_config=device_config).run()
+
+    for data in extract_data:
+        filepath = output_path / (data.filepath.stem+'_0.jpg')
+
+        dflimg = DFLIMG.load(filepath)
+        image_to_face_mat = dflimg.get_image_to_face_mat()
+
+        json_dict = images_jsons[data.filepath]
+
+        ie_polys = IEPolys()
+        for shape in json_dict['shapes']:
+            ie_poly = ie_polys.add(1)
+
+            points = np.array( [ [x,y] for x,y in shape['points'] ] )
+            points = LandmarksProcessor.transform_points(points, image_to_face_mat)
+
+            for x,y in points:
+                ie_poly.add( int(x), int(y) )
+
+        dflimg.embed_and_set (filepath, ie_polys=ie_polys)
+
+    """
+    #mark only
+    for data in extract_data:
+        filepath = data.filepath
+        output_filepath = output_path / (filepath.stem+'.jpg')
+
+        img = cv2_imread(filepath)
+        img = imagelib.normalize_channels(img, 3)
+        cv2_imwrite(output_filepath, img, [int(cv2.IMWRITE_JPEG_QUALITY), 100] )
+
+        json_dict = images_jsons[filepath]
+
+        ie_polys = IEPolys()
+        for shape in json_dict['shapes']:
+            ie_poly = ie_polys.add(1)
+            for x,y in shape['points']:
+                ie_poly.add( int(x), int(y) )
+
+        DFLJPG.embed_data(output_filepath, face_type=FaceType.toString(FaceType.MARK_ONLY),
+                                           landmarks=data.landmarks[0],
+                                           ie_polys=ie_polys,
+                                           source_filename=filepath.name,
+                                           source_rect=data.rects[0],
+                                           source_landmarks=data.landmarks[0]
+                          )
+    """
+
+    io.log_info("Done.")
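The new dev_test seeds the extractor with a rect computed as the bounding box of every labelme polygon point in the image's .json sidecar, then re-projects the polygons into face space and embeds them as IEPolys. A standalone sketch of just the bounding-rect step (the JSON here is a hypothetical labelme-style annotation):

    import json
    import numpy as np

    # Hypothetical labelme-style annotation with one polygon shape
    json_dict = json.loads('{"shapes": [{"points": [[10, 20], [40, 25], [30, 60]]}]}')

    total_points = np.array([ [x, y] for shape in json_dict['shapes']
                                     for x, y in shape['points'] ])

    l, r = int(total_points[:, 0].min()), int(total_points[:, 0].max())
    t, b = int(total_points[:, 1].min()), int(total_points[:, 1].max())
    rect = [l, t, r, b]   # fed to ExtractSubprocessor.Data(filepath, rects=[rect])
    print(rect)           # [10, 20, 40, 60]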
models/Model_FANSeg/Model.py (new file, 171 lines)
@@ -0,0 +1,171 @@
+import multiprocessing
+import operator
+from functools import partial
+
+import numpy as np
+
+from core import mathlib
+from core.interact import interact as io
+from core.leras import nn
+from facelib import FaceType, TernausNet
+from models import ModelBase
+from samplelib import *
+
+class FANSegModel(ModelBase):
+
+    #override
+    def on_initialize_options(self):
+        device_config = nn.getCurrentDeviceConfig()
+        yn_str = {True:'y',False:'n'}
+
+        #default_resolution = 256
+        default_face_type = self.options['face_type'] = self.load_or_def_option('face_type', 'wf')
+
+        ask_override = self.ask_override()
+        if self.is_first_run() or ask_override:
+            self.ask_autobackup_hour()
+            self.ask_write_preview_history()
+            self.ask_target_iter()
+            self.ask_batch_size(4)
+
+        if self.is_first_run():
+            #resolution = io.input_int("Resolution", default_resolution, add_info="64-512")
+            #resolution = np.clip ( (resolution // 16) * 16, 64, 512)
+            #self.options['resolution'] = resolution
+            self.options['face_type'] = io.input_str ("Face type", default_face_type, ['h','mf','f','wf']).lower()
+
+    #override
+    def on_initialize(self):
+        device_config = nn.getCurrentDeviceConfig()
+        nn.initialize(data_format="NHWC")
+        tf = nn.tf
+
+        devices = device_config.devices
+
+        self.resolution = resolution = 256 #self.options['resolution']
+        self.face_type = {'h'  : FaceType.HALF,
+                          'mf' : FaceType.MID_FULL,
+                          'f'  : FaceType.FULL,
+                          'wf' : FaceType.WHOLE_FACE}[ self.options['face_type'] ]
+
+        place_model_on_cpu = len(devices) == 0
+        models_opt_device = '/CPU:0' if place_model_on_cpu else '/GPU:0'
+
+        bgr_shape = nn.get4Dshape(resolution,resolution,3)
+        mask_shape = nn.get4Dshape(resolution,resolution,1)
+
+        # Initializing model classes
+        self.model = TernausNet('FANSeg',
+                                resolution,
+                                FaceType.toString(self.face_type),
+                                load_weights=not self.is_first_run(),
+                                weights_file_root=self.get_model_root_path(),
+                                training=True,
+                                place_model_on_cpu=place_model_on_cpu)
+
+        if self.is_training:
+            # Adjust batch size for multiple GPU
+            gpu_count = max(1, len(devices) )
+            bs_per_gpu = max(1, self.get_batch_size() // gpu_count)
+            self.set_batch_size( gpu_count*bs_per_gpu)
+
+            # Compute losses per GPU
+            gpu_pred_list = []
+
+            gpu_losses = []
+            gpu_loss_gvs = []
+
+            for gpu_id in range(gpu_count):
+                with tf.device( f'/GPU:{gpu_id}' if len(devices) != 0 else f'/CPU:0' ):
+
+                    with tf.device(f'/CPU:0'):
+                        # slice on CPU, otherwise all batch data will be transfered to GPU first
+                        batch_slice = slice( gpu_id*bs_per_gpu, (gpu_id+1)*bs_per_gpu )
+                        gpu_input_t  = self.model.input_t [batch_slice,:,:,:]
+                        gpu_target_t = self.model.target_t [batch_slice,:,:,:]
+
+                    # process model tensors
+                    gpu_pred_logits_t, gpu_pred_t = self.model.net([gpu_input_t])
+                    gpu_pred_list.append(gpu_pred_t)
+
+                    gpu_loss = tf.reduce_mean( tf.nn.sigmoid_cross_entropy_with_logits(labels=gpu_target_t, logits=gpu_pred_logits_t), axis=[1,2,3])
+                    gpu_losses += [gpu_loss]
+
+                    gpu_loss_gvs += [ nn.tf_gradients ( gpu_loss, self.model.net_weights ) ]
+
+            # Average losses and gradients, and create optimizer update ops
+            with tf.device (models_opt_device):
+                pred = nn.tf_concat(gpu_pred_list, 0)
+                loss = tf.reduce_mean(gpu_losses)
+
+                loss_gv_op = self.model.opt.get_update_op (nn.tf_average_gv_list (gpu_loss_gvs))
+
+            # Initializing training and view functions
+            def train(input_np, target_np):
+                l, _ = nn.tf_sess.run ( [loss, loss_gv_op], feed_dict={self.model.input_t :input_np, self.model.target_t :target_np })
+                return l
+            self.train = train
+
+            def view(input_np):
+                return nn.tf_sess.run ( [pred], feed_dict={self.model.input_t :input_np})
+            self.view = view
+
+            # initializing sample generators
+            training_data_src_path = self.training_data_src_path
+            #training_data_dst_path = self.training_data_dst_path
+
+            cpu_count = min(multiprocessing.cpu_count(), 8)
+            src_generators_count = cpu_count // 2
+            dst_generators_count = cpu_count // 2
+            src_generators_count = int(src_generators_count * 1.5)
+
+            self.set_training_data_generators ([
+                    SampleGeneratorFace(training_data_src_path, random_ct_samples_path=training_data_src_path, debug=self.is_debug(), batch_size=self.get_batch_size(),
+                                        sample_process_options=SampleProcessor.Options(random_flip=True),
+                                        output_sample_types = [ {'sample_type': SampleProcessor.SampleType.FACE_IMAGE, 'ct_mode':'idt', 'warp':True, 'transform':True, 'channel_type' : SampleProcessor.ChannelType.BGR, 'face_type':self.face_type, 'motion_blur':(25, 5), 'gaussian_blur':(25,5), 'data_format':nn.data_format, 'resolution': resolution},
+                                                                {'sample_type': SampleProcessor.SampleType.FACE_MASK, 'warp':True, 'transform':True, 'channel_type' : SampleProcessor.ChannelType.G, 'face_mask_type' : SampleProcessor.FaceMaskType.NONE, 'face_type':self.face_type, 'data_format':nn.data_format, 'resolution': resolution},
+                                                              ],
+                                        generators_count=src_generators_count ),
+                ])
+
+    #override
+    def get_model_filename_list(self):
+        return self.model.model_filename_list
+
+    #override
+    def onSave(self):
+        self.model.save_weights()
+
+    #override
+    def onTrainOneIter(self):
+        ( (source_np, target_np), ) = self.generate_next_samples()
+        loss = self.train (source_np, target_np)
+
+        return ( ('loss', loss ), )
+
+    #override
+    def onGetPreview(self, samples):
+        n_samples = min(4, self.get_batch_size(), 800 // self.resolution )
+
+        ( (source_np, target_np), ) = samples
+
+        S, T, SM, = [ np.clip(x, 0.0, 1.0) for x in ([source_np,target_np] + self.view (source_np) ) ]
+        T, SM, = [ np.repeat (x, (3,), -1) for x in [T, SM] ]
+
+        result = []
+
+        st = []
+        for i in range(n_samples):
+            ar = S[i], T[i], SM[i], S[i]*SM[i]
+            #todo green bg
+            st.append ( np.concatenate ( ar, axis=1) )
+        result += [ ('FANSeg', np.concatenate (st, axis=0 )), ]
+
+        return result
+
+Model = FANSegModel
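Model.py parallelizes training by hand: the whole batch sits in CPU-side placeholders, each GPU slices off its bs_per_gpu chunk, computes its own sigmoid-cross-entropy loss and gradients, and the per-tower gradients are averaged into a single optimizer update. A condensed, runnable sketch of that slice-and-average pattern (TF1 API; tf.add_n and tf.train.RMSPropOptimizer stand in for the leras helpers nn.tf_average_gv_list and nn.TFRMSpropOptimizer, and plain devices replace the /GPU:n placement):

    # Sketch: slice one batch across towers and average gradients (TF1 API).
    import numpy as np
    import tensorflow.compat.v1 as tf
    tf.disable_v2_behavior()

    tower_count, bs_per_tower = 2, 4
    x = tf.placeholder(tf.float32, (None, 16))
    y = tf.placeholder(tf.float32, (None, 1))
    w = tf.Variable(tf.zeros((16, 1)))

    tower_losses, tower_grads = [], []
    for i in range(tower_count):
        sl = slice(i * bs_per_tower, (i + 1) * bs_per_tower)   # per-tower slice
        loss = tf.reduce_mean(tf.square(tf.matmul(x[sl], w) - y[sl]))
        tower_losses.append(loss)
        tower_grads.append(tf.gradients(loss, [w])[0])

    avg_loss = tf.reduce_mean(tower_losses)
    avg_grad = tf.add_n(tower_grads) / tower_count   # stand-in for nn.tf_average_gv_list
    update = tf.train.RMSPropOptimizer(1e-4).apply_gradients([(avg_grad, w)])

    with tf.Session() as sess:
        sess.run(tf.global_variables_initializer())
        feed = {x: np.random.rand(8, 16), y: np.random.rand(8, 1)}
        print(sess.run([avg_loss, update], feed)[0])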
models/Model_FANSeg/__init__.py (new file, 1 line)
@@ -0,0 +1 @@
+from .Model import Model
@@ -148,7 +148,28 @@ class SampleProcessor(object):
                     raise ValueError("only channel_type.G supported for the mask")

             elif sample_type == SPST.FACE_IMAGE:
                 img = sample_bgr
+
+                if sample_face_type == FaceType.MARK_ONLY:
+                    mat = LandmarksProcessor.get_transform_mat (sample_landmarks, warp_resolution, face_type)
+                    img = cv2.warpAffine( img, mat, (warp_resolution,warp_resolution), flags=cv2.INTER_CUBIC )
+                    img = imagelib.warp_by_params (params, img, warp, transform, can_flip=True, border_replicate=border_replicate)
+                    img = cv2.resize( img, (resolution,resolution), cv2.INTER_CUBIC )
+                else:
+                    img = imagelib.warp_by_params (params, img, warp, transform, can_flip=True, border_replicate=border_replicate)
+                    mat = LandmarksProcessor.get_transform_mat (sample_landmarks, resolution, face_type)
+                    img = cv2.warpAffine( img, mat, (resolution,resolution), borderMode=borderMode, flags=cv2.INTER_CUBIC )
+
+                img = np.clip(img.astype(np.float32), 0, 1)
+
+                # Apply random color transfer
+                if ct_mode is not None and ct_sample is not None:
+                    if ct_sample_bgr is None:
+                        ct_sample_bgr = ct_sample.load_bgr()
+                    img = imagelib.color_transfer (ct_mode, img, cv2.resize( ct_sample_bgr, (resolution,resolution), cv2.INTER_LINEAR ) )
+
                 if motion_blur is not None:
                     chance, mb_max_size = motion_blur
                     chance = np.clip(chance, 0, 100)
@@ -171,25 +192,7 @@ class SampleProcessor(object):

                     if gblur_rnd_chance < chance:
                         img = cv2.GaussianBlur(img, (gblur_rnd_kernel,) *2 , 0)

-                if sample_face_type == FaceType.MARK_ONLY:
-                    mat = LandmarksProcessor.get_transform_mat (sample_landmarks, warp_resolution, face_type)
-                    img = cv2.warpAffine( img, mat, (warp_resolution,warp_resolution), flags=cv2.INTER_CUBIC )
-                    img = imagelib.warp_by_params (params, img, warp, transform, can_flip=True, border_replicate=border_replicate)
-                    img = cv2.resize( img, (resolution,resolution), cv2.INTER_CUBIC )
-                else:
-                    img = imagelib.warp_by_params (params, img, warp, transform, can_flip=True, border_replicate=border_replicate)
-                    mat = LandmarksProcessor.get_transform_mat (sample_landmarks, resolution, face_type)
-                    img = cv2.warpAffine( img, mat, (resolution,resolution), borderMode=borderMode, flags=cv2.INTER_CUBIC )
-
-                img = np.clip(img.astype(np.float32), 0, 1)
-
-                # Apply random color transfer
-                if ct_mode is not None and ct_sample is not None:
-                    if ct_sample_bgr is None:
-                        ct_sample_bgr = ct_sample.load_bgr()
-                    img = imagelib.color_transfer (ct_mode, img, cv2.resize( ct_sample_bgr, (resolution,resolution), cv2.INTER_LINEAR ) )
-
                 # Transform from BGR to desired channel_type
                 if channel_type == SPCT.BGR:
                     out_sample = img
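The two SampleProcessor hunks are a reordering, not new logic: the face-space warp, the clip to [0,1], and the random color transfer now run before the motion/gaussian blur, so the blurs act on the final aligned image rather than being resampled by a later warp. A toy sketch of the new order (helper bodies are placeholders; the real ones are imagelib.warp_by_params, imagelib.color_transfer, and the cv2 blur calls):

    import numpy as np

    # Placeholder helpers standing in for the real imagelib / cv2 operations.
    def warp_to_face_space(img):    return img
    def random_color_transfer(img): return img * 0.9
    def random_blur(img):           return img

    def process_face_image(img):
        img = warp_to_face_space(img)                 # 1. geometric warp first
        img = np.clip(img.astype(np.float32), 0, 1)   # 2. clip to [0,1]
        img = random_color_transfer(img)              # 3. random color transfer
        img = random_blur(img)                        # 4. blur sees the aligned image
        return img

    print(process_face_image(np.ones((4, 4, 3))).mean())  # 0.9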