Upload code
- examples/1.png +0 -0
- examples/2.png +0 -0
- examples/3.png +0 -0
- src/README.md +9 -0
- src/__init__.py +4 -0
- src/face_morp.py +155 -0
- src/landmark_detector.py +109 -0
- src/process_images.py +43 -0
examples/1.png ADDED
examples/2.png ADDED
examples/3.png ADDED
src/README.md ADDED
@@ -0,0 +1,9 @@
+# Requirements
+```
+python=3.11.9
+mediapipe
+```
+# Usage
+```
+python mycode/main.py mycode/input_aligned --frames 30 --duration 3 --verbose
+```
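The `mycode/main.py` entry point referenced above is not part of this commit, and the requirements list is incomplete: the code added here also imports cv2 (opencv-python), numpy, scipy, tqdm, and dlib. The pipeline can also be driven directly through the `morph` function from `src/face_morp.py` below; a minimal sketch, assuming the input directory from the command above and picking `frame_rate=10` so that `duration=3` yields the same 30 frames per transition:

```
import os
from src.face_morp import morph

# Hypothetical input directory, mirroring the CLI invocation above
input_dir = "mycode/input_aligned"
image_files = sorted(os.path.join(input_dir, f) for f in os.listdir(input_dir))

# duration * frame_rate = 30 frames per transition, as in --frames 30 --duration 3
morph(image_files, duration=3, frame_rate=10, output="morph.mp4",
      guideline=False, is_dlib=False)
```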
src/__init__.py ADDED
@@ -0,0 +1,4 @@
+
+
+if __name__ == '__main__':
+    print("This is a placeholder for the main function")
src/face_morp.py ADDED
@@ -0,0 +1,155 @@
+import cv2
+import time
+import numpy as np
+from tqdm import tqdm
+from scipy.spatial import Delaunay
+from concurrent.futures import ProcessPoolExecutor
+
+from src.process_images import get_images_and_landmarks
+
+def morph(image_files, duration, frame_rate, output, guideline, is_dlib):
+    # Get the list of images and landmarks
+    images_list, landmarks_list = get_images_and_landmarks(image_files, is_dlib)
+
+    video_frames = []  # List of frames for the video
+
+    sequence_time = time.time()
+    print("Generating morph sequence...", end="\n\n")
+
+    # Use ProcessPoolExecutor to parallelize the generation of morph sequences
+    with ProcessPoolExecutor() as executor:
+        futures = []
+        for i in range(1, len(images_list)):
+            src_image, src_landmarks = images_list[i-1], landmarks_list[i-1]
+            dst_image, dst_landmarks = images_list[i], landmarks_list[i]
+
+            # Generate the Delaunay triangulation of the destination landmarks
+            tri = Delaunay(dst_landmarks).simplices
+
+            # Submit the task to the executor
+            futures.append((i, executor.submit(generate_morph_sequence, duration, frame_rate, src_image, dst_image, src_landmarks, dst_landmarks, tri, guideline)))
+
+        # Retrieve and store the results in the correct order
+        results = [None] * (len(images_list) - 1)
+        for idx, future in futures:
+            results[idx - 1] = future.result()
+
+    for sequence_frames in results:
+        video_frames.extend(sequence_frames)
+
+
+    print(f"Total time taken to generate morph sequence: {time.time() - sequence_time:.2f} seconds", end="\n\n")
+
+    # Write the frames to a video file
+    write_frames_to_video(video_frames, frame_rate, output)
+
+
+def generate_morph_sequence(duration, frame_rate, image1, image2, landmarks1, landmarks2, tri, guideline):
+    num_frames = int(duration * frame_rate)
+    morphed_frames = []
+
+    for frame in range(num_frames):
+        alpha = frame / (num_frames - 1) if num_frames > 1 else 1.0  # guard against single-frame sequences
+
+        # Work with floats for better precision
+        image1_float = np.float32(image1)
+        image2_float = np.float32(image2)
+
+        # Compute the intermediate landmarks at time alpha
+        landmarks = []
+        for i in range(len(landmarks1)):
+            x = (1 - alpha) * landmarks1[i][0] + alpha * landmarks2[i][0]
+            y = (1 - alpha) * landmarks1[i][1] + alpha * landmarks2[i][1]
+            landmarks.append((x, y))
+
+        # Allocate space for the final output
+        morphed_frame = np.zeros_like(image1_float)
+
+        for i in range(len(tri)):
+            x = tri[i][0]
+            y = tri[i][1]
+            z = tri[i][2]
+
+            t1 = [landmarks1[x], landmarks1[y], landmarks1[z]]
+            t2 = [landmarks2[x], landmarks2[y], landmarks2[z]]
+            t = [landmarks[x], landmarks[y], landmarks[z]]
+
+            # Morph one triangle at a time
+            morph_triangle(image1_float, image2_float, morphed_frame, t1, t2, t, alpha)
+
+            if guideline:
+                # Draw the triangle edges as guidelines
+                points = [(int(t[i][0]), int(t[i][1])) for i in range(3)]
+                for i in range(3):
+                    # image, (x1, y1), (x2, y2), color, thickness, lineType, shift
+                    cv2.line(morphed_frame, points[i], points[(i + 1) % 3], (255, 255, 255), 1, 8, 0)
+
+        # Swap the channels back to BGR (images were loaded as RGB) so cv2.VideoWriter saves correct colors
+        morphed_frame = cv2.cvtColor(np.uint8(morphed_frame), cv2.COLOR_BGR2RGB)
+
+        morphed_frames.append(morphed_frame)
+
+    return morphed_frames
+
+
+def morph_triangle(image1, image2, morphed_image, t1, t2, t, alpha):
+    # Calculate bounding rectangles and offset points together
+    r, r1, r2 = [cv2.boundingRect(np.float32([tri])) for tri in [t, t1, t2]]
+
+    # Offset the triangle points by the top-left corner of the corresponding bounding rectangle
+    t_rect, t1_rect, t2_rect = [[(tri[i][0] - rect[0], tri[i][1] - rect[1]) for i in range(3)]
+                                for tri, rect in zip([t, t1, t2], [r, r1, r2])]
+
+    # Create a mask to keep only the pixels inside the triangle
+    mask = np.zeros((r[3], r[2], 3), dtype=np.float32)
+    # Fill the mask with white pixels inside the triangle
+    cv2.fillConvexPoly(mask, np.int32(t_rect), (1.0, 1.0, 1.0), 16, 0)
+
+    # Extract the triangle from the first and second image
+    image1_rect = image1[r1[1]:r1[1]+r1[3], r1[0]:r1[0]+r1[2]]
+    image2_rect = image2[r2[1]:r2[1]+r2[3], r2[0]:r2[0]+r2[2]]
+
+    size = (r[2], r[3])  # Size of the bounding rectangle
+    # Apply affine transformations to warp both source triangles onto the intermediate triangle
+    warpImage1 = apply_affine_transform(image1_rect, t1_rect, t_rect, size)
+    warpImage2 = apply_affine_transform(image2_rect, t2_rect, t_rect, size)
+
+    # Alpha-blend the warped triangles and copy the result into the destination image
+    morphed_image_rect = warpImage1 * (1 - alpha) + warpImage2 * alpha
+    morphed_image[r[1]:r[1]+r[3], r[0]:r[0]+r[2]] = morphed_image[r[1]:r[1]+r[3], r[0]:r[0]+r[2]] * (1 - mask) + morphed_image_rect * mask
+
+    return morphed_image
+
+
+def apply_affine_transform(img, src, dst, size):
+    """
+    Apply an affine transformation to the image.
+    """
+    warp_matrix = cv2.getAffineTransform(np.float32(src), np.float32(dst))
+    return cv2.warpAffine(img, warp_matrix, (size[0], size[1]), None, flags=cv2.INTER_LINEAR, borderMode=cv2.BORDER_REPLICATE)
+
+
+def write_frames_to_video(frames, frame_rate, output):
+    # Get the height and width of the frames
+    height, width, _ = frames[0].shape
+
+    # Crop the outer pixels to remove the black border
+    pad = 2
+    new_height = height - pad * 2
+    new_width = width - pad * 2
+
+
+    # Initialize the video writer
+    fourcc = cv2.VideoWriter_fourcc(*'mp4v')
+    out = cv2.VideoWriter(output, fourcc, frame_rate, (new_width, new_height))
+
+    # Write the frames to the video
+    print("Writing frames to video...")
+    for frame in tqdm(frames):
+        # Crop the outer pixels
+        cut_frame = frame[pad:new_height+pad, pad:new_width+pad]
+
+        out.write(cut_frame)
+
+    out.release()
+    print(f"Video saved at: {output}")
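At the heart of the morph, each triangle pair is warped onto the intermediate triangle with `apply_affine_transform` and the two warps are alpha-blended: `morphed = (1 - alpha) * warp(image1) + alpha * warp(image2)`. The warp can be sanity-checked in isolation with an identity mapping, where the output should equal the input; a minimal sketch, assuming the module is importable as `src.face_morp`:

```
import numpy as np
from src.face_morp import apply_affine_transform

# A small gradient patch and a triangle mapped onto itself:
# the affine transform is then the identity, so the warp is a no-op.
patch = np.arange(48, dtype=np.float32).reshape(4, 4, 3)
tri = [(0, 0), (3, 0), (0, 3)]
warped = apply_affine_transform(patch, tri, tri, (4, 4))
assert np.allclose(warped, patch)
```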
src/landmark_detector.py ADDED
@@ -0,0 +1,109 @@
+import os
+import cv2
+import dlib
+import mediapipe as mp
+
+def read_image(image_path):
+    """
+    Read an image from the given path and convert it to RGB.
+    """
+    image = cv2.imread(image_path)
+    if image is None:
+        raise FileNotFoundError(f"Image not found at path: {image_path}")
+
+    return cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+
+
+class DlibLandmarkDetector:
+    def __init__(self, predictor_model_path=f'{os.path.dirname(os.path.abspath(__file__))}/utils/shape_predictor_68_face_landmarks.dat'):
+        """
+        :param predictor_model_path: path to the shape_predictor_68_face_landmarks.dat file
+        """
+        self.detector = dlib.get_frontal_face_detector()  # cnn_face_detection_model_v1 can also be used
+        self.predictor = dlib.shape_predictor(predictor_model_path)
+
+    def get_landmarks(self, image_path):
+        # image = dlib.load_rgb_image(image_path)
+        image = read_image(image_path)
+        height, width, _ = image.shape
+
+        # Detect the faces in the image
+        dets = self.detector(image, 1)  # 1 means upsample the image once; higher values may give better results
+
+        # Raise an exception if no face is detected
+        if len(dets) == 0:
+            raise Exception(f"No face detected in the image at path: {image_path}")
+
+        # Get the landmarks of the first face detected
+        face_landmarks = [(item.x, item.y) for item in self.predictor(image, dets[0]).parts()]
+
+        # Add corner and edge midpoints as landmarks to include the background
+        corner_landmarks = [(1, 1), (1, height - 1), (width - 1, 1), (width - 1, height - 1)]
+        edge_landmarks = [(1, (height - 1)//2), ((width - 1)//2, 1), ((width - 1)//2, height - 1), (width - 1, (height - 1)//2)]
+
+        # Concatenate the landmarks
+        landmarks = face_landmarks + corner_landmarks + edge_landmarks
+
+        return landmarks, image
+
+    def show_landmarked_image(self, image_path, landmarks):
+        image = read_image(image_path)
+
+        for landmark in landmarks:
+            x, y = landmark
+            cv2.circle(image, (x, y), 1, (255, 255, 0), -1)  # image, (x, y), radius, color, thickness (-1 to fill)
+
+        cv2.imshow('image', image)
+        cv2.waitKey(0)
+        cv2.destroyAllWindows()
+
+
+class MediaPipeLandmarkDetector:
+    def __init__(self):
+
+        self.face_mesh = mp.solutions.face_mesh.FaceMesh(
+            static_image_mode=True,
+            max_num_faces=1,
+            min_detection_confidence=0.5)
+
+
+    def get_landmarks(self, image_path):
+
+        image = read_image(image_path)
+        height, width, _ = image.shape
+        # read_image already returns RGB, which is what FaceMesh expects
+
+        # Process the image
+        results = self.face_mesh.process(image)
+
+        # Raise an exception if no face is detected
+        if results.multi_face_landmarks is None:
+            raise Exception(f"No face detected in the image at path: {image_path}")
+
+        # Extract the face landmarks
+        face_landmarks = results.multi_face_landmarks[0]
+        face_landmarks_normalized = [[landmark.x, landmark.y] for landmark in face_landmarks.landmark]
+
+        # Add corner and edge midpoints as landmarks to include the background
+        corner_landmarks = [(0, 0), (0, 1), (1, 0), (1, 1)]
+        edge_landmarks = [(0, 0.5), (0.5, 0), (0.5, 1), (1, 0.5)]
+
+        # Concatenate the corner and edge landmarks
+        landmarks = corner_landmarks + edge_landmarks + face_landmarks_normalized
+
+        # Scale the normalized landmarks to pixel coordinates
+        landmarks = [(int(x * width) - 1, int(y * height) - 1) for x, y in landmarks]
+        landmarks = [(max(1, x), max(1, y)) for x, y in landmarks]
+
+        return landmarks, image
+
+    def show_landmarked_image(self, image_path, landmarks):
+        image = cv2.imread(image_path)
+
+        for landmark in landmarks:
+            x, y = landmark
+            cv2.circle(image, (x, y), 1, (255, 255, 0), -1)
+
+        cv2.imshow('image', image)
+        cv2.waitKey(0)
+        cv2.destroyAllWindows()
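Both detector classes expose the same interface: `get_landmarks` returns pixel-coordinate landmarks (the detected face points plus eight corner and edge points, so the Delaunay triangulation also covers the background) together with the RGB image. A minimal sketch using the MediaPipe detector on one of the bundled example images:

```
from src.landmark_detector import MediaPipeLandmarkDetector

detector = MediaPipeLandmarkDetector()
landmarks, image = detector.get_landmarks("examples/1.png")

# 8 border points + 468 MediaPipe face-mesh points = 476 landmarks
print(f"Detected {len(landmarks)} landmarks on a {image.shape[1]}x{image.shape[0]} image")
detector.show_landmarked_image("examples/1.png", landmarks)
```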
src/process_images.py ADDED
@@ -0,0 +1,43 @@
+import os
+from tqdm import tqdm
+
+from src.landmark_detector import MediaPipeLandmarkDetector, DlibLandmarkDetector
+
+
+def get_images_and_landmarks(image_list, is_dlib):
+
+    # Keep only the supported image files from the provided list
+    image_paths = []
+    for file in image_list:
+        if file.endswith(".jpg") or file.endswith(".png"):
+            image_paths.append(file)
+        else:
+            print(f"Skipping file: {file}. Not a supported image format (jpg or png).")
+
+    if len(image_paths) < 2:
+        raise ValueError("At least two images are required for morphing.")
+
+
+    landmarks_list = []  # List of landmarks for each image
+    images_list = []  # List of images
+
+    # Initialize the landmark detector
+    landmark_detector = DlibLandmarkDetector() if is_dlib else MediaPipeLandmarkDetector()
+
+    print("Generating landmarks for the images...")
+
+    # Detect landmarks for each image
+    for image_path in tqdm(image_paths):
+        try:
+            landmarks, image = landmark_detector.get_landmarks(image_path)
+            landmarks_list.append(landmarks)
+            images_list.append(image)
+        except Exception as e:
+            print(f"{e} \nSkipping image: {image_path}\n")
+            continue
+
+    if len(landmarks_list) < 2:
+        raise ValueError("At least two faces are required for morphing.")
+
+
+    return images_list, landmarks_list
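`get_images_and_landmarks` is the first step `morph` runs: it filters the input list to supported formats, detects landmarks per image, and skips any image where detection fails. It can also be called on its own; a short sketch over the example images shipped with this commit:

```
from src.process_images import get_images_and_landmarks

images, landmarks = get_images_and_landmarks(
    ["examples/1.png", "examples/2.png", "examples/3.png"], is_dlib=False)

print(f"Loaded {len(images)} images with {len(landmarks[0])} landmarks each")
```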