JDAI-CV
diff --git a/‎addition_module/face_parsing/README.md
+21 b/‎addition_module/face_parsing/README.md
+21
diff --git a/‎data/images/face_parsing.jpg
39 KB b/‎data/images/face_parsing.jpg
39 KB
diff --git a/‎face_sdk/README.md
+1 b/‎face_sdk/README.md
+1
diff --git a/‎face_sdk/api_usage/face_parsing.py
+108 b/‎face_sdk/api_usage/face_parsing.py
+108
diff --git a/‎face_sdk/config/model_conf.yaml
+1 b/‎face_sdk/config/model_conf.yaml
+1
diff --git a/‎face_sdk/core/model_handler/face_parsing/FaceParsingModelHandler.py
+92 b/‎face_sdk/core/model_handler/face_parsing/FaceParsingModelHandler.py
+92
diff --git a/‎face_sdk/core/model_loader/face_parsing/FaceParsingModelLoader.py
+28 b/‎face_sdk/core/model_loader/face_parsing/FaceParsingModelLoader.py
+28
diff --git a/‎face_sdk/models/face_parsing/face_parsing_1.0/model_meta.json
+8 b/‎face_sdk/models/face_parsing/face_parsing_1.0/model_meta.json
+8
diff --git a/‎face_sdk/test.jpg
39.2 KB b/‎face_sdk/test.jpg
39.2 KB
@@ -0,0 +1,21 @@
+# Face Parsing
+This repo hosts the face parsing implementation of the CVPR 2022 paper "General Facial Representation Learning in a Visual-Linguistic Manner".
+
+# Some Results by FaRL
+![image](../../data/images/face_parsing.jpg)
+
+# Requirements
+* python >= 3.7.1
+* pytorch >= 1.9.1
+
+# Pre-trained Model
+[face_parsing.farl.lapa](https://github.com/FacePerceiver/facer/releases/download/models-v1/face_parsing.farl.lapa.main_ema_136500_jit191.pt)
+
+Please put the pre-trained model under `FaceX-Zoo/face_sdk/models/face_parsing/face_parsing_1.0/`.
+
+# Usage
+```sh
+cd ../../face_sdk
+python api_usage/face_parsing.py
+```
+
+# Reference  
+This project is mainly inspired by [FaRL](https://github.com/FacePerceiver/FaRL).
@@ -23,6 +23,7 @@ python api_usage/face_alignment.py  # Get 106 landmark of a face
 python api_usage/face_crop.py  # Get croped face from a image
 python api_usage/face_feature.py  # Get features of a face
 python api_usage/face_pipline.py # Run face recognition pipeline
+python api_usage/face_parsing.py # Run face parsing pipeline
 ```
 The results will be saved at [api_usage/temp](api_usage/temp)
 ## Update the models  
 
@@ -0,0 +1,108 @@
+import sys
+sys.path.append('.')
+import logging
+mpl_logger = logging.getLogger('matplotlib')
+mpl_logger.setLevel(logging.WARNING)
+import logging.config
+logging.config.fileConfig("config/logging.conf")
+logger = logging.getLogger('api')
+
+import yaml
+import cv2
+import numpy as np
+import torch
+from utils.show import show_bchw
+from utils.draw import draw_bchw
+from core.model_loader.face_parsing.FaceParsingModelLoader import FaceParsingModelLoader
+from core.model_handler.face_parsing.FaceParsingModelHandler import FaceParsingModelHandler
+from core.model_loader.face_detection.FaceDetModelLoader import FaceDetModelLoader
+from core.model_handler.face_detection.FaceDetModelHandler import FaceDetModelHandler
+from core.model_loader.face_alignment.FaceAlignModelLoader import FaceAlignModelLoader
+from core.model_handler.face_alignment.FaceAlignModelHandler import FaceAlignModelHandler
+
+with open('config/model_conf.yaml') as f:
+    model_conf = yaml.load(f,Loader=yaml.FullLoader)
+
+if __name__ == '__main__':
+    # common setting for all models, need not modify.
+    model_path = 'models'
+
+    # face detection model setting.
+    scene = 'non-mask'
+    model_category = 'face_detection'
+    model_name =  model_conf[scene][model_category]
+    logger.info('Start to load the face detection model...')
+    try:
+        faceDetModelLoader = FaceDetModelLoader(model_path, model_category, model_name)
+        model, cfg = faceDetModelLoader.load_model()
+        faceDetModelHandler = FaceDetModelHandler(model, 'cuda:0', cfg)
+    except Exception as e:
+        logger.error('Falied to load face detection Model.')
+        logger.error(e)
+        sys.exit(-1)
+    else:
+        logger.info('Success!')
+
+    # face landmark model setting.
+    model_category = 'face_alignment'
+    model_name =  model_conf[scene][model_category]
+    logger.info('Start to load the face landmark model...')
+    try:
+        faceAlignModelLoader = FaceAlignModelLoader(model_path, model_category, model_name)
+        model, cfg = faceAlignModelLoader.load_model()
+        faceAlignModelHandler = FaceAlignModelHandler(model, 'cuda:0', cfg)
+    except Exception as e:
+        logger.error('Failed to load face landmark model.')
+        logger.error(e)
+        sys.exit(-1)
+    else:
+        logger.info('Success!')        
+        
+    # face parsing model setting.
+    scene = 'non-mask'
+    model_category = 'face_parsing'
+    model_name =  model_conf[scene][model_category]
+    logger.info('Start to load the face parsing model...')
+    try:
+        faceParsingModelLoader = FaceParsingModelLoader(model_path, model_category, model_name)
+        model, cfg = faceParsingModelLoader.load_model()
+        faceParsingModelHandler = FaceParsingModelHandler(model, 'cuda:0', cfg)
+    except Exception as e:
+        logger.error('Falied to load face parsing Model.')
+        logger.error(e)
+        sys.exit(-1)
+    else:
+        logger.info('Success!')
+
+
+
+    # read image and get face features.
+    image_path = 'api_usage/test_images/test1.jpg'
+    image = cv2.imread(image_path, cv2.IMREAD_COLOR)
+    try:
+        dets = faceDetModelHandler.inference_on_image(image)
+        face_nums = dets.shape[0]
+        with torch.no_grad():
+            for i in range(face_nums):
+                landmarks = faceAlignModelHandler.inference_on_image(image, dets[i])
+
+                landmarks = torch.from_numpy(landmarks[[104,105,54,84,90]]).float()
+                if i == 0:
+                    landmarks_five = landmarks
+                else:
+                    landmarks_five = torch.stack([landmarks_five,landmarks], dim = 0)   
+
+            print(landmarks_five.shape)
+            faces = faceParsingModelHandler.inference_on_image(face_nums, image, landmarks_five)
+            seg_logits = faces['seg']['logits']
+
+
+            seg_probs = seg_logits.softmax(dim=1)  # nfaces x nclasses x h x w
+            show_bchw(draw_bchw(image, faces))  
+            
+    except Exception as e:
+        logger.error('Parsing failed!')
+        logger.error(e)
+        sys.exit(-1)
+    else:
+        logger.info('Success!')
@@ -2,6 +2,7 @@ non-mask:
     face_detection: face_detection_1.0
     face_alignment: face_alignment_1.0
     face_recognition: face_recognition_1.0
+    face_parsing: face_parsing_1.0
 mask:
     face_detection: face_detection_2.0
     face_alignment: face_alignment_2.0
 
@@ -0,0 +1,92 @@
+# based on:
+# https://github.com/FacePerceiver/facer/blob/main/facer/face_parsing/farl.py
+import functools
+import logging.config
+logging.config.fileConfig("config/logging.conf")
+logger = logging.getLogger('sdk')
+
+import torch
+import torch.nn.functional as F
+import numpy as np
+from math import ceil
+from itertools import product as product
+import torch.backends.cudnn as cudnn
+
+from core.model_handler.BaseModelHandler import BaseModelHandler
+from utils.transform import *
+
+pretrain_settings = {
+    'lapa/448': {
+        'matrix_src_tag': 'points',
+        'get_matrix_fn': functools.partial(get_face_align_matrix,
+                                           target_shape=(448, 448), target_face_scale=1.0),
+        'get_grid_fn': functools.partial(make_tanh_warp_grid,
+                                         warp_factor=0.8, warped_shape=(448, 448)),
+        'get_inv_grid_fn': functools.partial(make_inverted_tanh_warp_grid,
+                                             warp_factor=0.8, warped_shape=(448, 448)),
+        'label_names': ['background', 'face', 'rb', 'lb', 're',
+                        'le', 'nose',  'ulip', 'imouth', 'llip', 'hair']
+    }
+}
+
+
+class FaceParsingModelHandler(BaseModelHandler):
+    def __init__(self, model=None, device=None, cfg=None):
+        super().__init__(model, device, cfg)
+        
+        self.model = model.to(self.device)
+    def _preprocess(self, image, face_nums):
+        """Preprocess the image, such as standardization and other operations.
+
+        Returns:
+            A tensor, the shape is 1 x 3 x h x w.
+            A dict, {'rects','points','scores','image_ids'} 
+        """
+        if not isinstance(image, np.ndarray):
+            logger.error('The input should be the ndarray read by cv2!')
+            raise InputError()
+        img = np.float32(image)
+        img = img.transpose(2, 0, 1)
+        img = np.expand_dims(img,0).repeat(face_nums,axis=0)
+        return torch.from_numpy(img)
+    def inference_on_image(self, face_nums: int, images: torch.Tensor, landmarks):
+        """Get the inference of the image and process the inference result.
+
+        Returns:
+             
+        """
+        cudnn.benchmark = True
+        try:
+            image_pre = self._preprocess(images, face_nums)
+        except Exception as e:
+            raise e
+        setting = pretrain_settings['lapa/448']
+        images = image_pre.float() / 255.0
+        _, _, h, w = images.shape
+        simages = images.to(self.device)
+        matrix = setting['get_matrix_fn'](landmarks.to(self.device))
+        grid = setting['get_grid_fn'](matrix=matrix, orig_shape=(h, w))
+        inv_grid = setting['get_inv_grid_fn'](matrix=matrix, orig_shape=(h, w))
+
+        w_images = F.grid_sample(
+            simages, grid, mode='bilinear', align_corners=False)
+
+        w_seg_logits, _ = self.model(w_images)  # (b*n) x c x h x w
+
+        seg_logits = F.grid_sample(
+            w_seg_logits, inv_grid, mode='bilinear', align_corners=False)
+        data_pre = {}
+        data_pre['seg'] = {'logits': seg_logits,
+                       'label_names': setting['label_names']}
+        return data_pre
+    
+    def _postprocess(self, loc, conf, scale, input_height, input_width):
+        """Postprecess the prediction result.
+        Decode detection result, set the confidence threshold and do the NMS
+        to keep the appropriate detection box. 
+
+        Returns:
+            A numpy array, the shape is N * (x, y, w, h, confidence), 
+            N is the number of detection box.
+        """
+        pass
@@ -0,0 +1,28 @@
+import logging.config
+logging.config.fileConfig("config/logging.conf")
+logger = logging.getLogger('sdk')
+
+import torch
+
+from core.model_loader.BaseModelLoader import BaseModelLoader
+
+class FaceParsingModelLoader(BaseModelLoader):
+    def __init__(self, model_path, model_category, model_name, meta_file='model_meta.json'):
+        logger.info('Start to analyze the face parsing model, model path: %s, model category: %s，model name: %s' %
+                    (model_path, model_category, model_name))
+        super().__init__(model_path, model_category, model_name, meta_file)
+
+        self.cfg['input_height'] = self.meta_conf['input_height']
+        self.cfg['input_width'] = self.meta_conf['input_width']
+
+        
+    def load_model(self):
+        try:
+            model = torch.jit.load(self.cfg['model_file_path'])
+        except Exception as e:
+            logger.error('The model failed to load, please check the model path: %s!'
+                         % self.cfg['model_file_path'])
+            raise e
+        else:
+            logger.info('Successfully loaded the face parsing model!')
+            return model, self.cfg
@@ -0,0 +1,8 @@
+{
+    "model_type" : "face_parsing.farl.lapa",
+    "model_info" : "some model info",
+    "model_file" : "face_parsing.farl.lapa.main_ema_136500_jit191.pt",
+    "release_date" : "20220226",
+    "input_height" : 448,
+    "input_width" : 448
+}