Spaces:

Astridkraft
/

Stable-ControlNet-GPU

Paused

App Files Files Community

Astridkraft committed on Jan 4

Commit

5eb4d07

verified ·

1 Parent(s): 9940b7d

Update sam_module.py

Browse files

Files changed (1) hide show

sam_module.py +67 -15

sam_module.py CHANGED Viewed

@@ -853,6 +853,18 @@ def create_sam_mask(self, image, bbox_coords, mode):
                 print(f"       • Konfidenz-Score: {confidence_score:.3f}")
                 print(f"       • GESAMTSCORE: {score:.3f}")
                 # ============================================================
                 # THRESHOLD-BESTIMMUNG
@@ -870,6 +882,32 @@ def create_sam_mask(self, image, bbox_coords, mode):
                 print(f"   🎯 Gesichts-Threshold: {dynamic_threshold:.3f}")
                 # ============================================================
                 #        POSTPROCESSING
                 # ============================================================
@@ -939,10 +977,23 @@ def create_sam_mask(self, image, bbox_coords, mode):
                 # ABSCHLIESSENDE STATISTIK
                 # ============================================================
                 original_face_area = original_bbox_size[0] * original_bbox_size[1]
                 coverage_ratio = white_pixels / original_face_area if original_face_area > 0 else 0
                 print(f"   👤 GESICHTSABDECKUNG: {coverage_ratio:.1%} der ursprünglichen BBox")
                 # Warnungen basierend auf Abdeckung
                 if coverage_ratio < 0.7:
                     print(f"   ⚠️  WARNUNG: Geringe Gesichtsabdeckung ({coverage_ratio:.1%})")
@@ -951,29 +1002,30 @@ def create_sam_mask(self, image, bbox_coords, mode):
                 elif 0.8 <= coverage_ratio <= 1.2:
                     print(f"   ✅ OPTIMALE Gesichtsabdeckung ({coverage_ratio:.1%})")
                 # Zurück zu PIL Image
                 mask = Image.fromarray(mask_array).convert("L")
-                raw_mask = Image.fromarray(raw_mask_array).convert("L")
                 print("#" * 80)
                 print(f"✅ SAM 2 SEGMENTIERUNG ABGESCHLOSSEN")
                 print(f"📐 Finale Maskengröße: {mask.size}")
                 print(f"🎛️  Verwendeter Modus: {mode}")
-                # ============================================================
-                # FINALE AUSGABE FÜR GESICHTSMODUS
-                # ============================================================
-               if crop_size is not None:
-                   print(f"👤 Bei face_only_change: Crop={crop_size}×{crop_size}px, Heuristik-Score={best_score:.3f}")
-                   print(f"👤 Kopfabdeckung: {coverage_ratio:.1%} der BBox")
-            print(f"   DEBUG NACHHER - Min/Max: {mask_array.min()}/{mask_array.max()}, Typ: {mask_array.dtype}")
-            print("#" * 80)
-            return mask, raw_mask
         # ============================================================
         # UNBEKANNTER MODUS
         # ============================================================

                 print(f"       • Konfidenz-Score: {confidence_score:.3f}")
                 print(f"       • GESAMTSCORE: {score:.3f}")
+                if score > best_score:
+                    best_score = score
+                    best_mask_idx = i
+                    print(f"     🏆 Neue beste Maske: Nr. {i+1} mit Score {score:.3f}")
+            print(f"✅ Beste Maske ausgewählt: Nr. {best_mask_idx+1} mit Score {best_score:.3f}")
+            # Beste Maske verwenden
+            mask_np = all_masks[best_mask_idx]
+            max_val = mask_np.max()
+            print(f"🔍 Maximaler SAM-Konfidenzwert der besten Maske: {max_val:.3f}")
                 # ============================================================
                 # THRESHOLD-BESTIMMUNG
                 print(f"   🎯 Gesichts-Threshold: {dynamic_threshold:.3f}")
+                # Binärmaske erstellen
+                print("🐛 DEBUG THRESHOLD:")
+                print(f"   mask_np Min/Max: {mask_np.min():.3f}/{mask_np.max():.3f}")
+                print(f"   dynamic_threshold: {dynamic_threshold:.3f}")
+                mask_array = (mask_np > dynamic_threshold).astype(np.uint8) * 255
+                print(f"🚨 DEBUG BINÄRMASKE:")
+                print(f"   mask_array Min/Max: {mask_array.min()}/{mask_array.max()}")
+                print(f"   Weiße Pixel in mask_array: {np.sum(mask_array > 0)}")
+                print(f"   Anteil weiße Pixel: {np.sum(mask_array > 0) / mask_array.size:.1%}")
+                # Fallback wenn Maske leer
+                if mask_array.max() == 0:
+                    print("⚠️  KRITISCH: Binärmaske ist leer! Erzwinge Testmaske (BBox).")
+                    print(f"   🚨 BBox für Fallback: x1={x1}, y1={y1}, x2={x2}, y2={y2}")
+                test_mask = np.zeros((image.height, image.width), dtype=np.uint8)
+                cv2.rectangle(test_mask, (x1, y1), (x2, y2), 255, -1)
+                mask_array = test_mask
+                print(f"🐛 DEBUG ERZWUNGENE MASKE: Weiße Pixel: {np.sum(mask_array > 0)}")
+                # Rohmaske speichern
+                raw_mask_array = mask_array.copy()
                 # ============================================================
                 #        POSTPROCESSING
                 # ============================================================
                 # ABSCHLIESSENDE STATISTIK
                 # ============================================================
+                print("📊 FINALE MASKEN-STATISTIK")
+                # Weiße Pixel zählen
+                white_pixels = np.sum(mask_array > 0)
+                total_pixels = mask_array.size
+                white_ratio = white_pixels / total_pixels * 100
+                # Original-BBox Fläche (vor Crop)
                 original_face_area = original_bbox_size[0] * original_bbox_size[1]
                 coverage_ratio = white_pixels / original_face_area if original_face_area > 0 else 0
                 print(f"   👤 GESICHTSABDECKUNG: {coverage_ratio:.1%} der ursprünglichen BBox")
+                print(f"   Weiße Pixel (Veränderungsbereich): {white_pixels:,} ({white_ratio:.1f}%)")
+                print(f"   Schwarze Pixel (Erhaltungsbereich): {total_pixels-white_pixels:,} ({100-white_ratio:.1f}%)")
+                print(f"   Gesamtpixel: {total_pixels:,}")
+                print(f"   👤 GESICHTSABDECKUNG: {coverage_ratio:.1%} der ursprünglichen BBox")
                 # Warnungen basierend auf Abdeckung
                 if coverage_ratio < 0.7:
                     print(f"   ⚠️  WARNUNG: Geringe Gesichtsabdeckung ({coverage_ratio:.1%})")
                 elif 0.8 <= coverage_ratio <= 1.2:
                     print(f"   ✅ OPTIMALE Gesichtsabdeckung ({coverage_ratio:.1%})")
+                #===============
                 # Zurück zu PIL Image
                 mask = Image.fromarray(mask_array).convert("L")
+                raw_mask = Image.fromarray(raw_mask_array).convert("L")
                 print("#" * 80)
                 print(f"✅ SAM 2 SEGMENTIERUNG ABGESCHLOSSEN")
                 print(f"📐 Finale Maskengröße: {mask.size}")
                 print(f"🎛️  Verwendeter Modus: {mode}")
+                print(f"👤 Crop={crop_size}×{crop_size}px, Heuristik-Score={best_score:.3f}")
+                print(f"👤 Kopfabdeckung: {coverage_ratio:.1%} der BBox")
+                print(f"🔍 DEBUG FINALE MASKE:")
+                print(f"   mask_array Min/Max: {mask_array.min()}/{mask_array.max()}, Typ: {mask_array.dtype}")
+                print(f"   Weiße Pixel final: {np.sum(mask_array > 0)}")
+                print("#" * 80)
+                return mask, raw_mask
         # ============================================================
         # UNBEKANNTER MODUS
         # ============================================================