4 年之前 · 192e8f8199
--- a/README.md
+++ b/README.md
@@ -0,0 +1,29 @@
 
				+# FaceSwap
			
 
				+Swap face between two photos for Python 3 with OpenCV and dlib.
			
 
				+
			
 
				+## Get Started
			
 
				+```sh
			
 
				+python main.py --src imgs/test6.jpg --dst imgs/test7.jpg --out results/output6_7.jpg
			
 
				+```
			
 
				+
			
 
				+| Source | Destination | Result |
			
 
				+| --- | --- | --- |
			
 
				+|![](imgs/test7.jpg) | ![](imgs/test6.jpg) | ![](results/output7_6.jpg) |
			
 
				+
			
 
				+
			
 
				+
			
 
				+```sh
			
 
				+python main.py --src imgs/test6.jpg --dst imgs/test7.jpg --out results/output6_7.jpg --point_plot True
			
 
				+```
			
 
				+![](imgs/landmark_vis) 
			
 
				+
			
 
				+## Dlib landmarks points
			
 
				+![](imgs/68points.jpg)
			
 
				+
			
 
				+
			
 
				+## Install
			
 
				+### Requirements
			
 
				+* `pip install -r requirements.txt`
			
 
				+* OpenCV 3: `conda install opencv` (If you have conda/anaconda)
			
 
				+
			
 
				+Note: See [requirements.txt](requirements.txt) for more details.
			
--- a/face_detection.py
+++ b/face_detection.py
@@ -0,0 +1,117 @@
 
				+import cv2
			
 
				+import dlib
			
 
				+import numpy as np
			
 
				+
			
 
				+## Face detection
			
 
				+def face_detection(img,upsample_times=1):
			
 
				+    # Ask the detector to find the bounding boxes of each face. The 1 in the
			
 
				+    # second argument indicates that we should upsample the image 1 time. This
			
 
				+    # will make everything bigger and allow us to detect more faces.
			
 
				+    detector = dlib.get_frontal_face_detector()
			
 
				+    faces = detector(img, upsample_times)
			
 
				+
			
 
				+    return faces
			
 
				+
			
 
				+PREDICTOR_PATH = 'models/shape_predictor_68_face_landmarks.dat'
			
 
				+predictor = dlib.shape_predictor(PREDICTOR_PATH)
			
 
				+
			
 
				+## Face and points detection
			
 
				+def face_points_detection(img, bbox:dlib.rectangle):
			
 
				+    # Get the landmarks/parts for the face in box d.
			
 
				+    shape = predictor(img, bbox)
			
 
				+
			
 
				+    # loop over the 68 facial landmarks and convert them
			
 
				+    # to a 2-tuple of (x, y)-coordinates
			
 
				+    coords = np.asarray(list([p.x, p.y] for p in shape.parts()), dtype=np.int)
			
 
				+
			
 
				+    # return the array of (x, y)-coordinates
			
 
				+    return coords
			
 
				+
			
 
				+
			
 
				+def select_face(im, r=10, choose=True):
			
 
				+    faces = face_detection(im)
			
 
				+
			
 
				+    if len(faces) == 0:
			
 
				+        return None, None, None
			
 
				+
			
 
				+    if len(faces) == 1 or not choose:
			
 
				+        idx = int(np.argmax([(face.right() - face.left()) * (face.bottom() - face.top()) for face in faces]))
			
 
				+        bbox = faces[idx]
			
 
				+    else:
			
 
				+        bbox = []
			
 
				+
			
 
				+        def click_on_face(event, x, y, flags, params):
			
 
				+            if event != cv2.EVENT_LBUTTONDOWN:
			
 
				+                return
			
 
				+
			
 
				+            for face in faces:
			
 
				+                if face.left() < x < face.right() and face.top() < y < face.bottom():
			
 
				+                    bbox.append(face)
			
 
				+                    break
			
 
				+
			
 
				+        im_copy = im.copy()
			
 
				+        for face in faces:
			
 
				+            # draw the face bounding box
			
 
				+            cv2.rectangle(im_copy, (face.left(), face.top()), (face.right(), face.bottom()), (0, 0, 255), 1)
			
 
				+        cv2.imshow('Click the Face:', im_copy)
			
 
				+        cv2.setMouseCallback('Click the Face:', click_on_face)
			
 
				+        while len(bbox) == 0:
			
 
				+            cv2.waitKey(1)
			
 
				+        cv2.destroyAllWindows()
			
 
				+        bbox = bbox[0]
			
 
				+
			
 
				+    points = np.asarray(face_points_detection(im, bbox))
			
 
				+
			
 
				+    im_w, im_h = im.shape[:2]
			
 
				+    left, top = np.min(points, 0)
			
 
				+    right, bottom = np.max(points, 0)
			
 
				+
			
 
				+    x, y = max(0, left - r), max(0, top - r)
			
 
				+    w, h = min(right + r, im_h) - x, min(bottom + r, im_w) - y
			
 
				+
			
 
				+    return points - np.asarray([[x, y]]), (x, y, w, h), im[y:y + h, x:x + w]
			
 
				+
			
 
				+
			
 
				+def get_landmarks(im):
			
 
				+    """
			
 
				+    Function that returns the face landmarks.
			
 
				+    """
			
 
				+    rects = face_detection(im, upsample_times=1)
			
 
				+    
			
 
				+    if len(rects) > 1:
			
 
				+        #print("Too Many Faces") #raise TooManyFaces
			
 
				+        return []
			
 
				+    if len(rects) == 0:
			
 
				+        #print("No Faces") #raise NoFaces
			
 
				+        return []
			
 
				+
			
 
				+    return np.matrix([[p.x, p.y] for p in predictor(im, rects[0]).parts()])
			
 
				+
			
 
				+SCALE_FACTOR = 1 
			
 
				+def read_im_and_landmarks(fname):
			
 
				+    """
			
 
				+    Function that read the images and gets the face landmarks
			
 
				+    in the read images.
			
 
				+    """
			
 
				+    im = cv2.imread(fname, cv2.IMREAD_COLOR)
			
 
				+    im = cv2.resize(im, (im.shape[1] * SCALE_FACTOR,
			
 
				+                         im.shape[0] * SCALE_FACTOR))
			
 
				+    s = get_landmarks(im)
			
 
				+
			
 
				+    return im, s
			
 
				+
			
 
				+
			
 
				+def mask_mouth(source_img):
			
 
				+    img, marks = read_im_and_landmarks(source_img)
			
 
				+    
			
 
				+    tmp_img=img.copy()
			
 
				+    tmp_blank_img=img.copy()
			
 
				+    tmp_blank_img=tmp_blank_img*0
			
 
				+    
			
 
				+    mask_list=marks[49:61]
			
 
				+
			
 
				+    draw_img=cv2.drawContours(tmp_blank_img,[mask_list],-1,(255,255,255),-1)
			
 
				+    draw_img_re=cv2.bitwise_not(draw_img)
			
 
				+    tmp_img=tmp_img&draw_img_re
			
 
				+    
			
 
				+    return tmp_img
			
--- a/face_swap.py
+++ b/face_swap.py
@@ -0,0 +1,238 @@
 
				+#! /usr/bin/env python
			
 
				+import cv2
			
 
				+import numpy as np
			
 
				+import scipy.spatial as spatial
			
 
				+import logging
			
 
				+
			
 
				+
			
 
				+## 3D Transform
			
 
				+def bilinear_interpolate(img, coords):
			
 
				+    """ Interpolates over every image channel
			
 
				+    http://en.wikipedia.org/wiki/Bilinear_interpolation
			
 
				+    :param img: max 3 channel image
			
 
				+    :param coords: 2 x _m_ array. 1st row = xcoords, 2nd row = ycoords
			
 
				+    :returns: array of interpolated pixels with same shape as coords
			
 
				+    """
			
 
				+    int_coords = np.int32(coords)
			
 
				+    x0, y0 = int_coords
			
 
				+    dx, dy = coords - int_coords
			
 
				+
			
 
				+    # 4 Neighour pixels
			
 
				+    q11 = img[y0, x0]
			
 
				+    q21 = img[y0, x0 + 1]
			
 
				+    q12 = img[y0 + 1, x0]
			
 
				+    q22 = img[y0 + 1, x0 + 1]
			
 
				+
			
 
				+    btm = q21.T * dx + q11.T * (1 - dx)
			
 
				+    top = q22.T * dx + q12.T * (1 - dx)
			
 
				+    inter_pixel = top * dy + btm * (1 - dy)
			
 
				+
			
 
				+    return inter_pixel.T
			
 
				+
			
 
				+def grid_coordinates(points):
			
 
				+    """ x,y grid coordinates within the ROI of supplied points
			
 
				+    :param points: points to generate grid coordinates
			
 
				+    :returns: array of (x, y) coordinates
			
 
				+    """
			
 
				+    xmin = np.min(points[:, 0])
			
 
				+    xmax = np.max(points[:, 0]) + 1
			
 
				+    ymin = np.min(points[:, 1])
			
 
				+    ymax = np.max(points[:, 1]) + 1
			
 
				+
			
 
				+    return np.asarray([(x, y) for y in range(ymin, ymax)
			
 
				+                       for x in range(xmin, xmax)], np.uint32)
			
 
				+
			
 
				+
			
 
				+def process_warp(src_img, result_img, tri_affines, dst_points, delaunay):
			
 
				+    """
			
 
				+    Warp each triangle from the src_image only within the
			
 
				+    ROI of the destination image (points in dst_points).
			
 
				+    """
			
 
				+    roi_coords = grid_coordinates(dst_points)
			
 
				+    # indices to vertices. -1 if pixel is not in any triangle
			
 
				+    roi_tri_indices = delaunay.find_simplex(roi_coords)
			
 
				+
			
 
				+    for simplex_index in range(len(delaunay.simplices)):
			
 
				+        coords = roi_coords[roi_tri_indices == simplex_index]
			
 
				+        num_coords = len(coords)
			
 
				+        out_coords = np.dot(tri_affines[simplex_index],
			
 
				+                            np.vstack((coords.T, np.ones(num_coords))))
			
 
				+        x, y = coords.T
			
 
				+        result_img[y, x] = bilinear_interpolate(src_img, out_coords)
			
 
				+
			
 
				+    return None
			
 
				+
			
 
				+
			
 
				+def triangular_affine_matrices(vertices, src_points, dst_points):
			
 
				+    """
			
 
				+    Calculate the affine transformation matrix for each
			
 
				+    triangle (x,y) vertex from dst_points to src_points
			
 
				+    :param vertices: array of triplet indices to corners of triangle
			
 
				+    :param src_points: array of [x, y] points to landmarks for source image
			
 
				+    :param dst_points: array of [x, y] points to landmarks for destination image
			
 
				+    :returns: 2 x 3 affine matrix transformation for a triangle
			
 
				+    """
			
 
				+    ones = [1, 1, 1]
			
 
				+    for tri_indices in vertices:
			
 
				+        src_tri = np.vstack((src_points[tri_indices, :].T, ones))
			
 
				+        dst_tri = np.vstack((dst_points[tri_indices, :].T, ones))
			
 
				+        mat = np.dot(src_tri, np.linalg.inv(dst_tri))[:2, :]
			
 
				+        yield mat
			
 
				+
			
 
				+
			
 
				+def warp_image_3d(src_img, src_points, dst_points, dst_shape, dtype=np.uint8):
			
 
				+    rows, cols = dst_shape[:2]
			
 
				+    result_img = np.zeros((rows, cols, 3), dtype=dtype)
			
 
				+
			
 
				+    delaunay = spatial.Delaunay(dst_points)
			
 
				+    tri_affines = np.asarray(list(triangular_affine_matrices(
			
 
				+        delaunay.simplices, src_points, dst_points)))
			
 
				+
			
 
				+    process_warp(src_img, result_img, tri_affines, dst_points, delaunay)
			
 
				+
			
 
				+    return result_img
			
 
				+
			
 
				+
			
 
				+## 2D Transform
			
 
				+def transformation_from_points(points1, points2):
			
 
				+    points1 = points1.astype(np.float64)
			
 
				+    points2 = points2.astype(np.float64)
			
 
				+
			
 
				+    c1 = np.mean(points1, axis=0)
			
 
				+    c2 = np.mean(points2, axis=0)
			
 
				+    points1 -= c1
			
 
				+    points2 -= c2
			
 
				+
			
 
				+    s1 = np.std(points1)
			
 
				+    s2 = np.std(points2)
			
 
				+    points1 /= s1
			
 
				+    points2 /= s2
			
 
				+
			
 
				+    U, S, Vt = np.linalg.svd(np.dot(points1.T, points2))
			
 
				+    R = (np.dot(U, Vt)).T
			
 
				+
			
 
				+    return np.vstack([np.hstack([s2 / s1 * R,
			
 
				+                                (c2.T - np.dot(s2 / s1 * R, c1.T))[:, np.newaxis]]),
			
 
				+                      np.array([[0., 0., 1.]])])
			
 
				+
			
 
				+
			
 
				+def warp_image_2d(im, M, dshape):
			
 
				+    output_im = np.zeros(dshape, dtype=im.dtype)
			
 
				+    cv2.warpAffine(im,
			
 
				+                   M[:2],
			
 
				+                   (dshape[1], dshape[0]),
			
 
				+                   dst=output_im,
			
 
				+                   borderMode=cv2.BORDER_TRANSPARENT,
			
 
				+                   flags=cv2.WARP_INVERSE_MAP)
			
 
				+
			
 
				+    return output_im
			
 
				+
			
 
				+
			
 
				+## Generate Mask
			
 
				+def mask_from_points(size, points,erode_flag=1):
			
 
				+    radius = 10  # kernel size
			
 
				+    kernel = np.ones((radius, radius), np.uint8)
			
 
				+
			
 
				+    mask = np.zeros(size, np.uint8)
			
 
				+    cv2.fillConvexPoly(mask, cv2.convexHull(points), 255)
			
 
				+    if erode_flag:
			
 
				+        mask = cv2.erode(mask, kernel,iterations=1)
			
 
				+
			
 
				+    return mask
			
 
				+
			
 
				+
			
 
				+## Color Correction
			
 
				+def correct_colours(im1, im2, landmarks1):
			
 
				+    COLOUR_CORRECT_BLUR_FRAC = 0.75
			
 
				+    LEFT_EYE_POINTS = list(range(42, 48))
			
 
				+    RIGHT_EYE_POINTS = list(range(36, 42))
			
 
				+
			
 
				+    blur_amount = COLOUR_CORRECT_BLUR_FRAC * np.linalg.norm(
			
 
				+                              np.mean(landmarks1[LEFT_EYE_POINTS], axis=0) -
			
 
				+                              np.mean(landmarks1[RIGHT_EYE_POINTS], axis=0))
			
 
				+    blur_amount = int(blur_amount)
			
 
				+    if blur_amount % 2 == 0:
			
 
				+        blur_amount += 1
			
 
				+    im1_blur = cv2.GaussianBlur(im1, (blur_amount, blur_amount), 0)
			
 
				+    im2_blur = cv2.GaussianBlur(im2, (blur_amount, blur_amount), 0)
			
 
				+
			
 
				+    # Avoid divide-by-zero errors.
			
 
				+    im2_blur = im2_blur.astype(int)
			
 
				+    im2_blur += 128*(im2_blur <= 1)
			
 
				+
			
 
				+    result = im2.astype(np.float64) * im1_blur.astype(np.float64) / im2_blur.astype(np.float64)
			
 
				+    result = np.clip(result, 0, 255).astype(np.uint8)
			
 
				+
			
 
				+    return result
			
 
				+
			
 
				+
			
 
				+## Copy-and-paste
			
 
				+def apply_mask(img, mask):
			
 
				+    """ Apply mask to supplied image
			
 
				+    :param img: max 3 channel image
			
 
				+    :param mask: [0-255] values in mask
			
 
				+    :returns: new image with mask applied
			
 
				+    """
			
 
				+    masked_img=cv2.bitwise_and(img,img,mask=mask)
			
 
				+
			
 
				+    return masked_img
			
 
				+
			
 
				+
			
 
				+## Alpha blending
			
 
				+def alpha_feathering(src_img, dest_img, img_mask, blur_radius=15):
			
 
				+    mask = cv2.blur(img_mask, (blur_radius, blur_radius))
			
 
				+    mask = mask / 255.0
			
 
				+
			
 
				+    result_img = np.empty(src_img.shape, np.uint8)
			
 
				+    for i in range(3):
			
 
				+        result_img[..., i] = src_img[..., i] * mask + dest_img[..., i] * (1-mask)
			
 
				+
			
 
				+    return result_img
			
 
				+
			
 
				+
			
 
				+def check_points(img,points):
			
 
				+    # Todo: I just consider one situation.
			
 
				+    if points[8,1]>img.shape[0]:
			
 
				+        logging.error("Jaw part out of image")
			
 
				+    else:
			
 
				+        return True
			
 
				+    return False
			
 
				+
			
 
				+
			
 
				+def face_swap(src_face, dst_face, src_points, dst_points, dst_shape, dst_img, args, end=48):
			
 
				+    h, w = dst_face.shape[:2]
			
 
				+
			
 
				+    ## 3d warp
			
 
				+    warped_src_face = warp_image_3d(src_face, src_points[:end], dst_points[:end], (h, w))
			
 
				+    ## Mask for blending
			
 
				+    mask = mask_from_points((h, w), dst_points)
			
 
				+    mask_src = np.mean(warped_src_face, axis=2) > 0
			
 
				+    mask = np.asarray(mask * mask_src, dtype=np.uint8)
			
 
				+    ## Correct color
			
 
				+    if args.correct_color:
			
 
				+        warped_src_face = apply_mask(warped_src_face, mask)
			
 
				+        dst_face_masked = apply_mask(dst_face, mask)
			
 
				+        warped_src_face = correct_colours(dst_face_masked, warped_src_face, dst_points)
			
 
				+    ## 2d warp
			
 
				+    if args.warp_2d:
			
 
				+        unwarped_src_face = warp_image_3d(warped_src_face, dst_points[:end], src_points[:end], src_face.shape[:2])
			
 
				+        warped_src_face = warp_image_2d(unwarped_src_face, transformation_from_points(dst_points, src_points),
			
 
				+                                        (h, w, 3))
			
 
				+
			
 
				+        mask = mask_from_points((h, w), dst_points)
			
 
				+        mask_src = np.mean(warped_src_face, axis=2) > 0
			
 
				+        mask = np.asarray(mask * mask_src, dtype=np.uint8)
			
 
				+
			
 
				+    ## Shrink the mask
			
 
				+    kernel = np.ones((10, 10), np.uint8)
			
 
				+    mask = cv2.erode(mask, kernel, iterations=1)
			
 
				+    ##Poisson Blending
			
 
				+    r = cv2.boundingRect(mask)
			
 
				+    center = ((r[0] + int(r[2] / 2), r[1] + int(r[3] / 2)))
			
 
				+    output = cv2.seamlessClone(warped_src_face, dst_face, mask, center, cv2.NORMAL_CLONE)
			
 
				+
			
 
				+    x, y, w, h = dst_shape
			
 
				+    dst_img_cp = dst_img.copy()
			
 
				+    dst_img_cp[y:y + h, x:x + w] = output
			
 
				+
			
 
				+    return dst_img_cp
			
--- a/imgs/68points.JPG
+++ b/imgs/68points.JPG
--- a/imgs/face.png
+++ b/imgs/face.png
--- a/imgs/landmark_vis.JPG
+++ b/imgs/landmark_vis.JPG
--- a/imgs/target.png
+++ b/imgs/target.png
--- a/imgs/test1.jpg
+++ b/imgs/test1.jpg
--- a/imgs/test2.jpg
+++ b/imgs/test2.jpg
--- a/imgs/test3.jpg
+++ b/imgs/test3.jpg
--- a/imgs/test4.jpg
+++ b/imgs/test4.jpg
--- a/imgs/test5.jpg
+++ b/imgs/test5.jpg
--- a/imgs/test6.jpg
+++ b/imgs/test6.jpg
--- a/imgs/test7.jpg
+++ b/imgs/test7.jpg
--- a/imgs/test7_.jpg
+++ b/imgs/test7_.jpg
--- a/imgs/test8.jpg
+++ b/imgs/test8.jpg
--- a/main.py
+++ b/main.py
@@ -0,0 +1,69 @@
 
				+#! /usr/bin/env python
			
 
				+import os
			
 
				+import cv2
			
 
				+import argparse
			
 
				+import numpy as np
			
 
				+
			
 
				+from face_detection import select_face, mask_mouth
			
 
				+from face_swap import face_swap
			
 
				+
			
 
				+
			
 
				+if __name__ == '__main__':
			
 
				+    parser = argparse.ArgumentParser(description='FaceSwapApp')
			
 
				+    parser.add_argument('--src', required=True, help='Path for source image')
			
 
				+    parser.add_argument('--dst', required=True, help='Path for target image')
			
 
				+    parser.add_argument('--out', required=True, help='Path for storing output images')
			
 
				+    parser.add_argument('--point_plot', default=False, help='facial landmark visualizations')
			
 
				+    parser.add_argument('--warp_2d', default=False, action='store_true', help='2d or 3d warp')
			
 
				+    parser.add_argument('--correct_color', default=False, action='store_true', help='Correct color')
			
 
				+    parser.add_argument('--no_debug_window', default=False, action='store_true', help='Don\'t show debug window')
			
 
				+    args = parser.parse_args()
			
 
				+
			
 
				+    # Read images
			
 
				+    src_img = cv2.imread(args.src)
			
 
				+    src_img_mask = mask_mouth(args.src)
			
 
				+    dst_img = cv2.imread(args.dst)
			
 
				+
			
 
				+    # Select src face
			
 
				+    src_points, src_shape, src_face = select_face(src_img_mask)
			
 
				+    # Select dst face
			
 
				+    dst_points, dst_shape, dst_face = select_face(dst_img)
			
 
				+
			
 
				+    if src_points is None or dst_points is None:
			
 
				+        print('Detect 0 Face !!!')
			
 
				+        exit(-1)
			
 
				+
			
 
				+    output = face_swap(src_face, dst_face, src_points, dst_points, dst_shape, dst_img, args)
			
 
				+
			
 
				+    dir_path = os.path.dirname(args.out)
			
 
				+    if not os.path.isdir(dir_path):
			
 
				+        os.makedirs(dir_path)
			
 
				+
			
 
				+    cv2.imwrite(args.out, output)
			
 
				+
			
 
				+    ##For debug
			
 
				+    if not args.no_debug_window:
			
 
				+        if args.point_plot:
			
 
				+            tmp_img=src_img.copy()
			
 
				+            x, y, w, h = src_shape
			
 
				+
			
 
				+            for point in src_points:
			
 
				+                x_, y_ = point.tolist()
			
 
				+                cv2.circle(tmp_img, [x_+x,y_+y], 6,  (0,0,255), -1)
			
 
				+                cv2.circle(tmp_img, [x_+x,y_+y], 3,  (255,255,255), -1)
			
 
				+
			
 
				+            tmp_img2=dst_img.copy()
			
 
				+            x, y, w, h = dst_shape
			
 
				+            for point in dst_points:
			
 
				+                x_, y_ = point.tolist()
			
 
				+                cv2.circle(tmp_img2, [x_+x,y_+y], 6,  (0,0,255), -1)
			
 
				+                cv2.circle(tmp_img2, [x_+x,y_+y], 3,  (255,255,255), -1)
			
 
				+
			
 
				+            result=np.hstack((tmp_img, tmp_img2, output))
			
 
				+        else:
			
 
				+            result=np.hstack((src_img, dst_img, output))
			
 
				+        cv2.namedWindow('result', 0)
			
 
				+        cv2.imshow("result", result)
			
 
				+        cv2.waitKey(0)
			
 
				+        
			
 
				+        cv2.destroyAllWindows()
			
--- a/models/shape_predictor_68_face_landmarks.dat
+++ b/models/shape_predictor_68_face_landmarks.dat
--- a/requirements.txt
+++ b/requirements.txt
@@ -0,0 +1,4 @@
 
				+dlib >= 19.9.0
			
 
				+numpy >= 1.13.1
			
 
				+scipy >= 0.18.0
			
 
				+imutils==0.5.4