Spaces:

dreamlessx
/

LandmarkDiff

Running

App Files Files Community

dreamlessx committed on Mar 14

Commit

b46d78e

verified ·

1 Parent(s): ff7e8d0

Upload landmarkdiff/landmarks.py with huggingface_hub

Browse files

Files changed (1) hide show

landmarkdiff/landmarks.py +258 -0

landmarkdiff/landmarks.py ADDED Viewed

	@@ -0,0 +1,258 @@

+"""MediaPipe Face Mesh v2 landmark extraction."""
+from __future__ import annotations
+from dataclasses import dataclass
+from pathlib import Path
+from typing import Optional
+import cv2
+import mediapipe as mp
+import numpy as np
+# Region color map for visualization.
+# Values are BGR tuples (OpenCV channel order), keyed by anatomical region name.
+# Left/right pairs share one color. The drawing functions in this module look
+# colors up by the region names of LANDMARK_REGIONS and use their own fallback
+# color for landmark indices that belong to no region.
+REGION_COLORS: dict[str, tuple[int, int, int]] = {
+    "jawline": (255, 255, 255),     # white
+    "eyebrow_left": (0, 255, 0),    # green
+    "eyebrow_right": (0, 255, 0),
+    "eye_left": (255, 255, 0),      # cyan
+    "eye_right": (255, 255, 0),
+    "nose": (0, 255, 255),          # yellow
+    "lips": (0, 0, 255),            # red
+    "iris_left": (255, 0, 255),     # magenta
+    "iris_right": (255, 0, 255),
+    # NOTE(review): LANDMARK_REGIONS defines no "face_oval" key, so this entry
+    # is never reached through the region lookups in this file.
+    "face_oval": (200, 200, 200),   # light gray
+}
+# MediaPipe landmark index groups by anatomical region.
+# Each list holds row indices into the landmark array stored on FaceLandmarks
+# (documented there as 478 rows). FaceLandmarks.get_region indexes the array
+# with these lists, and the drawing functions use them to choose a color per
+# landmark. Indices that appear in no list are drawn with a fallback color.
+LANDMARK_REGIONS: dict[str, list[int]] = {
+    # NOTE(review): this sequence looks like MediaPipe's full face-oval contour
+    # (forehead included) rather than only the jaw — confirm the region name.
+    "jawline": [
+        10, 338, 297, 332, 284, 251, 389, 356, 454, 323, 361, 288,
+        397, 365, 379, 378, 400, 377, 152, 148, 176, 149, 150, 136,
+        172, 58, 132, 93, 234, 127, 162, 21, 54, 103, 67, 109,
+    ],
+    "eye_left": [
+        33, 7, 163, 144, 145, 153, 154, 155, 133, 173, 157, 158, 159, 160, 161, 246,
+    ],
+    "eye_right": [
+        362, 382, 381, 380, 374, 373, 390, 249, 263, 466, 388, 387, 386, 385, 384, 398,
+    ],
+    "eyebrow_left": [70, 63, 105, 66, 107, 55, 65, 52, 53, 46],
+    "eyebrow_right": [300, 293, 334, 296, 336, 285, 295, 282, 283, 276],
+    "nose": [
+        1, 2, 4, 5, 6, 19, 94, 141, 168, 195, 197, 236, 240,
+        274, 275, 278, 279, 294, 326, 327, 360, 363, 370, 456, 460,
+    ],
+    "lips": [
+        61, 146, 91, 181, 84, 17, 314, 405, 321, 375, 291,
+        308, 324, 318, 402, 317, 14, 87, 178, 88, 95, 78,
+    ],
+    # Five points per iris; 468-477 are the last ten rows of a 478-row array.
+    # NOTE(review): presumably these rows only exist when the backend emits
+    # refined/iris landmarks — verify before indexing shorter arrays.
+    "iris_left": [468, 469, 470, 471, 472],
+    "iris_right": [473, 474, 475, 476, 477],
+}
+@dataclass(frozen=True)
+class FaceLandmarks:
+    """478 face landmarks + image size + detection confidence."""
+    landmarks: np.ndarray  # (478, 3) normalized (x, y, z)
+    image_width: int
+    image_height: int
+    confidence: float
+    @property
+    def pixel_coords(self) -> np.ndarray:
+        """Normalized -> pixel coords, shape (478, 2)."""
+        coords = self.landmarks[:, :2].copy()
+        coords[:, 0] *= self.image_width
+        coords[:, 1] *= self.image_height
+        return coords
+    def get_region(self, region: str) -> np.ndarray:
+        """Return landmarks for the given region name."""
+        indices = LANDMARK_REGIONS.get(region, [])
+        return self.landmarks[indices]
+def extract_landmarks(
+    image: np.ndarray,
+    min_detection_confidence: float = 0.5,
+    min_tracking_confidence: float = 0.5,
+) -> Optional[FaceLandmarks]:
+    """Run MediaPipe Face Mesh on a BGR image, return FaceLandmarks or None."""
+    h, w = image.shape[:2]
+    rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+    # Tasks API first, fall back to legacy solutions API
+    try:
+        landmarks, confidence = _extract_tasks_api(rgb, min_detection_confidence)
+    except Exception:
+        try:
+            landmarks, confidence = _extract_solutions_api(rgb, min_detection_confidence, min_tracking_confidence)
+        except Exception:
+            return None
+    if landmarks is None:
+        return None
+    return FaceLandmarks(
+        landmarks=landmarks,
+        image_width=w,
+        image_height=h,
+        confidence=confidence,
+    )
+def _extract_tasks_api(
+    rgb: np.ndarray,
+    min_confidence: float,
+) -> tuple[Optional[np.ndarray], float]:
+    """Tasks API path (mediapipe >= 0.10.20)."""
+    FaceLandmarker = mp.tasks.vision.FaceLandmarker
+    FaceLandmarkerOptions = mp.tasks.vision.FaceLandmarkerOptions
+    RunningMode = mp.tasks.vision.RunningMode
+    BaseOptions = mp.tasks.BaseOptions
+    import urllib.request
+    import tempfile
+    # Download model if not cached
+    model_path = Path(tempfile.gettempdir()) / "face_landmarker_v2_with_blendshapes.task"
+    if not model_path.exists():
+        url = "https://storage.googleapis.com/mediapipe-models/face_landmarker/face_landmarker/float16/1/face_landmarker.task"
+        urllib.request.urlretrieve(url, str(model_path))
+    options = FaceLandmarkerOptions(
+        base_options=BaseOptions(model_asset_path=str(model_path)),
+        running_mode=RunningMode.IMAGE,
+        num_faces=1,
+        min_face_detection_confidence=min_confidence,
+        output_face_blendshapes=False,
+        output_facial_transformation_matrixes=False,
+    )
+    with FaceLandmarker.create_from_options(options) as landmarker:
+        mp_image = mp.Image(image_format=mp.ImageFormat.SRGB, data=rgb)
+        result = landmarker.detect(mp_image)
+    if not result.face_landmarks:
+        return None, 0.0
+    face_lms = result.face_landmarks[0]
+    landmarks = np.array(
+        [(lm.x, lm.y, lm.z) for lm in face_lms],
+        dtype=np.float32,
+    )
+    return landmarks, min_confidence
+def _extract_solutions_api(
+    rgb: np.ndarray,
+    min_detection_confidence: float,
+    min_tracking_confidence: float,
+) -> tuple[Optional[np.ndarray], float]:
+    """Legacy solutions API fallback."""
+    with mp.solutions.face_mesh.FaceMesh(
+        static_image_mode=True,
+        max_num_faces=1,
+        refine_landmarks=True,
+        min_detection_confidence=min_detection_confidence,
+        min_tracking_confidence=min_tracking_confidence,
+    ) as face_mesh:
+        results = face_mesh.process(rgb)
+    if not results.multi_face_landmarks:
+        return None, 0.0
+    face = results.multi_face_landmarks[0]
+    landmarks = np.array(
+        [(lm.x, lm.y, lm.z) for lm in face.landmark],
+        dtype=np.float32,
+    )
+    return landmarks, min(min_detection_confidence, min_tracking_confidence)
+def visualize_landmarks(
+    image: np.ndarray,
+    face: FaceLandmarks,
+    radius: int = 1,
+    draw_regions: bool = True,
+) -> np.ndarray:
+    """Draw colored landmark dots on a copy of the image."""
+    canvas = image.copy()
+    coords = face.pixel_coords
+    if draw_regions:
+        # Build index -> color mapping
+        idx_to_color: dict[int, tuple[int, int, int]] = {}
+        for region, indices in LANDMARK_REGIONS.items():
+            color = REGION_COLORS.get(region, (255, 255, 255))
+            for idx in indices:
+                idx_to_color[idx] = color
+        for i, (x, y) in enumerate(coords):
+            color = idx_to_color.get(i, (128, 128, 128))
+            cv2.circle(canvas, (int(x), int(y)), radius, color, -1)
+    else:
+        for x, y in coords:
+            cv2.circle(canvas, (int(x), int(y)), radius, (255, 255, 255), -1)
+    return canvas
+def render_landmark_image(
+    face: FaceLandmarks,
+    width: Optional[int] = None,
+    height: Optional[int] = None,
+    radius: int = 2,
+) -> np.ndarray:
+    """Render tessellation mesh on black canvas. Falls back to dots if no connections."""
+    w = width or face.image_width
+    h = height or face.image_height
+    canvas = np.zeros((h, w, 3), dtype=np.uint8)
+    coords = face.landmarks[:, :2].copy()
+    coords[:, 0] *= w
+    coords[:, 1] *= h
+    pts = coords.astype(np.int32)
+    # Draw tessellation mesh (what CrucibleAI ControlNet expects)
+    try:
+        from mediapipe.tasks.python.vision.face_landmarker import FaceLandmarksConnections
+        tessellation = FaceLandmarksConnections.FACE_LANDMARKS_TESSELATION
+        contours = FaceLandmarksConnections.FACE_LANDMARKS_CONTOURS
+        # Draw tessellation edges (thin, gray-white)
+        for conn in tessellation:
+            p1 = tuple(pts[conn.start])
+            p2 = tuple(pts[conn.end])
+            cv2.line(canvas, p1, p2, (192, 192, 192), 1, cv2.LINE_AA)
+        # Draw contour edges on top (brighter, key features)
+        for conn in contours:
+            p1 = tuple(pts[conn.start])
+            p2 = tuple(pts[conn.end])
+            cv2.line(canvas, p1, p2, (255, 255, 255), 1, cv2.LINE_AA)
+    except ImportError:
+        # Fallback: draw colored dots if tessellation not available
+        idx_to_color: dict[int, tuple[int, int, int]] = {}
+        for region, indices in LANDMARK_REGIONS.items():
+            color = REGION_COLORS.get(region, (128, 128, 128))
+            for idx in indices:
+                idx_to_color[idx] = color
+        for i, (x, y) in enumerate(coords):
+            color = idx_to_color.get(i, (128, 128, 128))
+            cv2.circle(canvas, (int(x), int(y)), radius, color, -1)
+    return canvas
+def load_image(path: str | Path) -> np.ndarray:
+    """Load image as BGR numpy array, raises FileNotFoundError on failure."""
+    img = cv2.imread(str(path))
+    if img is None:
+        raise FileNotFoundError(f"Could not load image: {path}")
+    return img