Spaces:

VanNguyen1214
/

ghep_image

Running

App Files Files Community

VanNguyen1214 committed 10 days ago

Commit

a3f5fed

verified ·

1 Parent(s): 5f52a7e

Update segmentation.py

Browse files

Files changed (1) hide show

segmentation.py +98 -29

segmentation.py CHANGED Viewed

@@ -1,87 +1,156 @@
 import numpy as np
-import torch
-import torch.nn.functional as F
 import cv2
 from PIL import Image
-from transformers import SegformerImageProcessor, AutoModelForSemanticSegmentation
 import mediapipe as mp
-# SegFormer để phân vùng tóc
 processor = SegformerImageProcessor.from_pretrained("VanNguyen1214/get_face_and_hair")
 model     = AutoModelForSemanticSegmentation.from_pretrained("VanNguyen1214/get_face_and_hair")
 mp_face_mesh = mp.solutions.face_mesh
 def remove_hair_from_image(image: Image.Image) -> Image.Image:
     rgb = image.convert("RGB")
-    arr = np.array(rgb); h, w = arr.shape[:2]
     inputs = processor(images=rgb, return_tensors="pt")
     with torch.no_grad():
         logits = model(**inputs).logits.cpu()
     up = F.interpolate(logits, size=(h, w), mode="bilinear", align_corners=False)
-    pred = up.argmax(dim=1)[0].numpy()
-    hair_mask = (pred == 2).astype(np.uint8)
-    alpha = np.full((h, w), 255, np.uint8)
-    alpha[hair_mask > 0] = 0
     rgba = np.dstack([arr, alpha])
     return Image.fromarray(rgba)
 def get_facemesh_mask(image: Image.Image) -> np.ndarray:
     img = np.array(image.convert("RGB"))
     h, w = img.shape[:2]
-    mask = np.zeros((h, w), np.uint8)
     with mp_face_mesh.FaceMesh(
-        static_image_mode=True, max_num_faces=1,
-        refine_landmarks=True, min_detection_confidence=0.5
     ) as mesh:
         res = mesh.process(img)
         if res.multi_face_landmarks:
-            pts = [(int(lm.x*w), int(lm.y*h))
-                   for lm in res.multi_face_landmarks[0].landmark]
             hull = cv2.convexHull(np.array(pts, np.int32))
             cv2.fillConvexPoly(mask, hull, 1)
     return mask
-def expand_forehead_mask(face_mask: np.ndarray, pct: float=0.2) -> np.ndarray:
-    ys = np.where(face_mask>0)[0]
-    if ys.size==0: return face_mask
     y0, y1 = ys.min(), ys.max()
-    exp = int((y1-y0)*pct)
     top = max(y0 - exp, 0)
     out = np.zeros_like(face_mask)
-    out[top:top+(y1-y0)] = face_mask[y0:y1]
     return out
 def extract_face_and_forehead_no_hair(img: Image.Image) -> Image.Image:
     rgb = img.convert("RGB")
-    arr = np.array(rgb); h, w = arr.shape[:2]
-    # tóc
-    inp = processor(images=rgb, return_tensors="pt")
     with torch.no_grad():
-        logits = model(**inp).logits.cpu()
     up = F.interpolate(logits, size=(h, w), mode="bilinear", align_corners=False)
     seg = up.argmax(dim=1)[0].numpy()
     hair_mask = (seg == 2).astype(np.uint8)
-    # mặt+trán
     fm = get_facemesh_mask(img)
     fm_exp = expand_forehead_mask(fm, 0.2)
     fore = cv2.bitwise_and(fm_exp, 1 - fm)
     fore = cv2.bitwise_and(fore, 1 - hair_mask)
-    cm = ((fm + fore)>0).astype(np.uint8)
-    cm = cv2.GaussianBlur(cm.astype(np.float32),(3,3),0)
-    cm = (cm>0.5).astype(np.uint8)
     alpha = (cm * 255).astype(np.uint8)
     rgba  = np.dstack([arr, alpha])
     return Image.fromarray(rgba)
 def remove_face_using_segmentation(img: Image.Image) -> Image.Image:
     ff   = extract_face_and_forehead_no_hair(img)
-    mask = np.array(ff)[...,3] > 0
     ori  = img.convert("RGBA")
     arr  = np.array(ori)
-    arr[...,3][mask] = 0
     return Image.fromarray(arr)

+# segmentation.py
 import numpy as np
 import cv2
 from PIL import Image
+import torch
+import torch.nn.functional as F
 import mediapipe as mp
+from transformers import SegformerImageProcessor, AutoModelForSemanticSegmentation
# SegFormer checkpoint used for hair segmentation; the preprocessing
# configuration and the model weights are loaded from the same repository.
_SEGFORMER_CHECKPOINT = "VanNguyen1214/get_face_and_hair"
processor = SegformerImageProcessor.from_pretrained(_SEGFORMER_CHECKPOINT)
model = AutoModelForSemanticSegmentation.from_pretrained(_SEGFORMER_CHECKPOINT)

# MediaPipe FaceMesh module, used to build the face landmark mask.
mp_face_mesh = mp.solutions.face_mesh
 def remove_hair_from_image(image: Image.Image) -> Image.Image:
+    """
+    Remove hair: return RGBA with hair area transparent.
+    """
     rgb = image.convert("RGB")
+    arr = np.array(rgb)
+    h, w = arr.shape[:2]
+    # SegFormer hair mask
     inputs = processor(images=rgb, return_tensors="pt")
     with torch.no_grad():
         logits = model(**inputs).logits.cpu()
     up = F.interpolate(logits, size=(h, w), mode="bilinear", align_corners=False)
+    mask = up.argmax(dim=1)[0].numpy()
+    hair_mask = (mask == 2).astype(np.uint8)
+    alpha = np.full((h, w), 255, dtype=np.uint8)
+    alpha[hair_mask == 1] = 0
     rgba = np.dstack([arr, alpha])
     return Image.fromarray(rgba)
 def get_facemesh_mask(image: Image.Image) -> np.ndarray:
+    """
+    Return binary mask of face+forehead (no hair) using MediaPipe.
+    """
     img = np.array(image.convert("RGB"))
     h, w = img.shape[:2]
+    mask = np.zeros((h, w), dtype=np.uint8)
     with mp_face_mesh.FaceMesh(
+        static_image_mode=True,
+        max_num_faces=1,
+        refine_landmarks=True,
+        min_detection_confidence=0.5
     ) as mesh:
         res = mesh.process(img)
         if res.multi_face_landmarks:
+            pts = [(int(lm.x * w), int(lm.y * h)) for lm in res.multi_face_landmarks[0].landmark]
             hull = cv2.convexHull(np.array(pts, np.int32))
             cv2.fillConvexPoly(mask, hull, 1)
     return mask
def expand_forehead_mask(face_mask: np.ndarray, pct: float = 0.2) -> np.ndarray:
    """Return a copy of the face mask shifted upward toward the forehead.

    The rows spanned by the non-zero part of *face_mask* are copied into a
    new, otherwise zero, mask of the same shape, moved up by ``pct`` times the
    vertical extent of the face (clamped at the top edge of the image). The
    result does NOT contain the original face area by itself; callers combine
    it with *face_mask* to obtain the extra forehead band.

    Args:
        face_mask: 2-D mask whose non-zero entries mark the face.
        pct: Upward shift as a fraction of the face height (``y_max - y_min``).
            Expected to be non-negative.

    Returns:
        The shifted mask, or *face_mask* itself (not a copy) when it contains
        no non-zero entry.
    """
    ys = np.where(face_mask > 0)[0]
    if ys.size == 0:
        return face_mask

    y0, y1 = int(ys.min()), int(ys.max())
    shift = int((y1 - y0) * pct)
    top = max(y0 - shift, 0)

    # y1 is the last occupied row (inclusive), so the band is y1 - y0 + 1
    # rows tall; slicing with [y0:y1] would silently drop the bottom row and
    # erase a one-row mask entirely.
    n_rows = y1 - y0 + 1
    # Clip the band if it would run past the bottom edge (only possible for a
    # negative pct), instead of failing on a shape mismatch.
    n_rows = max(min(n_rows, face_mask.shape[0] - top), 0)

    out = np.zeros_like(face_mask)
    out[top:top + n_rows] = face_mask[y0:y0 + n_rows]
    return out
 def extract_face_and_forehead_no_hair(img: Image.Image) -> Image.Image:
+    """
+    Return RGBA where alpha=255 for face+forehead (no hair), alpha=0 elsewhere.
+    """
     rgb = img.convert("RGB")
+    arr = np.array(rgb)
+    h, w = arr.shape[:2]
+    # hair mask
+    inputs = processor(images=rgb, return_tensors="pt")
     with torch.no_grad():
+        logits = model(**inputs).logits.cpu()
     up = F.interpolate(logits, size=(h, w), mode="bilinear", align_corners=False)
     seg = up.argmax(dim=1)[0].numpy()
     hair_mask = (seg == 2).astype(np.uint8)
+    # face+forehead mask
     fm = get_facemesh_mask(img)
     fm_exp = expand_forehead_mask(fm, 0.2)
     fore = cv2.bitwise_and(fm_exp, 1 - fm)
     fore = cv2.bitwise_and(fore, 1 - hair_mask)
+    cm = ((fm + fore) > 0).astype(np.uint8)
+    cm = cv2.GaussianBlur(cm.astype(np.float32), (3, 3), 0)
+    cm = (cm > 0.5).astype(np.uint8)
     alpha = (cm * 255).astype(np.uint8)
     rgba  = np.dstack([arr, alpha])
     return Image.fromarray(rgba)
 def remove_face_using_segmentation(img: Image.Image) -> Image.Image:
+    """
+    Remove face+forehead: return RGBA with hair-only (alpha=255 hair, alpha=0 face).
+    """
     ff   = extract_face_and_forehead_no_hair(img)
+    mask = np.array(ff)[..., 3] > 0
     ori  = img.convert("RGBA")
     arr  = np.array(ori)
+    arr[..., 3][mask] = 0
     return Image.fromarray(arr)
def get_bbox_from_alpha(rgba: Image.Image):
    """Return the bounding box of the non-transparent pixels of *rgba*.

    The box is ``(x1, y1, x2, y2)`` with both corners inclusive, computed from
    the pixels whose alpha (channel index 3) is greater than 0. Returns
    ``None`` when every pixel is fully transparent.
    """
    visible = np.array(rgba)[..., 3] > 0

    # Project the visibility mask onto each axis instead of listing every
    # visible pixel coordinate.
    rows = np.flatnonzero(visible.any(axis=1))
    if rows.size == 0:
        return None
    cols = np.flatnonzero(visible.any(axis=0))

    return cols[0], rows[0], cols[-1], rows[-1]
def compute_scale(w_bg, h_bg, w_src, h_src):
    """Return the mean of the width ratio and the height ratio (bg / src)."""
    width_ratio = w_bg / w_src
    height_ratio = h_bg / h_src
    return (width_ratio + height_ratio) / 2
def compute_offset(bbox_bg, bbox_src, scale):
    """Return the ``(dx, dy)`` that aligns the scaled source box centre with the background box centre.

    Both boxes are ``(x1, y1, x2, y2)``. The source centre is multiplied by
    *scale* and truncated to an integer before being subtracted from the
    background centre.
    """

    def _midpoint(low, high):
        # Midpoint using floor division of the span.
        return low + (high - low) // 2

    bg_x1, bg_y1, bg_x2, bg_y2 = bbox_bg
    src_x1, src_y1, src_x2, src_y2 = bbox_src

    dx = _midpoint(bg_x1, bg_x2) - int(_midpoint(src_x1, src_x2) * scale)
    dy = _midpoint(bg_y1, bg_y2) - int(_midpoint(src_y1, src_y2) * scale)
    return dx, dy
def paste_with_alpha(bg: np.ndarray, src: np.ndarray, offset: tuple[int, int]) -> Image.Image:
    """Paste the visible pixels of *src* onto a copy of *bg* at *offset*.

    *offset* is the ``(x, y)`` position of the top-left corner of *src* in
    background coordinates; it may be negative or extend past the edges, in
    which case *src* is clipped to the background. A source pixel is copied
    when its alpha (channel index 3) is greater than 0; there is no blending.
    For a 3-channel background only the first three source channels are
    copied. *bg* itself is not modified.

    Returns the result as a PIL image.
    """
    canvas = bg.copy()
    off_x, off_y = offset
    src_h, src_w = src.shape[:2]

    # Overlap between the placed source and the background, in bg coordinates.
    left, top = max(off_x, 0), max(off_y, 0)
    right = min(off_x + src_w, bg.shape[1])
    bottom = min(off_y + src_h, bg.shape[0])

    if left < right and top < bottom:
        src_patch = src[top - off_y:bottom - off_y, left - off_x:right - off_x]
        # Basic slicing yields a view, so writing through it updates canvas.
        target = canvas[top:bottom, left:right]
        visible = src_patch[..., 3] > 0
        pixels = src_patch[visible]
        if target.shape[2] == 3:
            pixels = pixels[..., :3]
        target[visible] = pixels

    return Image.fromarray(canvas)