Spaces:

VanKee
/

InteractiveImageMosaicGenerator

Sleeping

App Files Files Community

VanKee committed on Sep 22, 2025

Commit

bdaf195

1 Parent(s): ce54710

update logic to no longer resize image.

Browse files

Files changed (18) hide show

.gitignore +2 -0
out/{mosaic_avg_32.png → cells_outline_3378.png} +2 -2
out/cells_outline_5090.png +3 -0
out/cells_outline_akaza.png +3 -0
out/{mosaic_palette_16_32.png → mosaic_adaptive_3378.png} +2 -2
out/mosaic_adaptive_5090.png +3 -0
out/mosaic_adaptive_akaza.png +3 -0
out/mosaic_cifar_adaptive_3378.png +3 -0
out/mosaic_cifar_adaptive_3378_10.png +3 -0
out/mosaic_cifar_adaptive_3378_100.png +3 -0
out/mosaic_cifar_adaptive_5090.png +3 -0
out/mosaic_cifar_adaptive_5090_10.png +3 -0
out/mosaic_cifar_adaptive_5090_100.png +3 -0
out/mosaic_cifar_adaptive_akaza_10.png +3 -0
out/mosaic_cifar_adaptive_akaza_100.png +3 -0
samples/akaza.jpg +3 -0
simple_mosaic.py +140 -23
tile_library.py +64 -0

.gitignore CHANGED Viewed

	@@ -1,2 +1,4 @@
1
2	.DS_Store

 .DS_Store
+cifar_data/
+__pycache__/

out/{mosaic_avg_32.png → cells_outline_3378.png} RENAMED Viewed

File without changes

out/cells_outline_5090.png ADDED Viewed

Git LFS Details

SHA256: 7b13de0f565f58704f48fc0e05ed728b61ff1f2a3be438253a7a8a2bb0411be5
Pointer size: 131 Bytes
Size of remote file: 161 kB

out/cells_outline_akaza.png ADDED Viewed

Git LFS Details

SHA256: bef9261c5396cce35fe33d0fc83f05b2287bcb45003b1491fcb8f4906ac2502a
Pointer size: 131 Bytes
Size of remote file: 352 kB

out/{mosaic_palette_16_32.png → mosaic_adaptive_3378.png} RENAMED Viewed

File without changes

out/mosaic_adaptive_5090.png ADDED Viewed

Git LFS Details

SHA256: 8185b3ea84980ce519603127538ae9ed6764cbd3a66df4a4eb17dc89228ee750
Pointer size: 130 Bytes
Size of remote file: 38.1 kB

out/mosaic_adaptive_akaza.png ADDED Viewed

Git LFS Details

SHA256: 67376de8f1ce3e78ff9ae37fdf033030cdccfd3928a6c3c73969538c54910f62
Pointer size: 131 Bytes
Size of remote file: 287 kB

out/mosaic_cifar_adaptive_3378.png ADDED Viewed

Git LFS Details

SHA256: 4816c74054bbf3172cb794991c1ad9c69ef96d2bfc18dbc9f5c15424113193bd
Pointer size: 131 Bytes
Size of remote file: 230 kB

out/mosaic_cifar_adaptive_3378_10.png ADDED Viewed

Git LFS Details

SHA256: 4816c74054bbf3172cb794991c1ad9c69ef96d2bfc18dbc9f5c15424113193bd
Pointer size: 131 Bytes
Size of remote file: 230 kB

out/mosaic_cifar_adaptive_3378_100.png ADDED Viewed

Git LFS Details

SHA256: 24c1e7b0d2e572ba503970a021714552452530564762da2bb31d7f03454592a1
Pointer size: 131 Bytes
Size of remote file: 275 kB

out/mosaic_cifar_adaptive_5090.png ADDED Viewed

Git LFS Details

SHA256: d74d8aaca6ad7cf7b2bbbc03b65229b4593393c0de9451102e50a0a78b70e641
Pointer size: 131 Bytes
Size of remote file: 252 kB

out/mosaic_cifar_adaptive_5090_10.png ADDED Viewed

Git LFS Details

SHA256: d0d687aebb9ed858d757ce18633e83a998b9c14be42a4440d7b2f8fe3235df4e
Pointer size: 131 Bytes
Size of remote file: 242 kB

out/mosaic_cifar_adaptive_5090_100.png ADDED Viewed

Git LFS Details

SHA256: bb62c46edc3f3c0597149b3043596a25cde5696fe47261a327c8de5942ac1f33
Pointer size: 131 Bytes
Size of remote file: 340 kB

out/mosaic_cifar_adaptive_akaza_10.png ADDED Viewed

Git LFS Details

SHA256: 0badc6ca8764f2919e1b505af8017d3f876d6a20f4b4e37a08ae1996c98e3d97
Pointer size: 132 Bytes
Size of remote file: 2.15 MB

out/mosaic_cifar_adaptive_akaza_100.png ADDED Viewed

Git LFS Details

SHA256: 3fa6a00da729013522c1b0d944367183f21969319a696e7b6777313786f155ca
Pointer size: 132 Bytes
Size of remote file: 2.65 MB

samples/akaza.jpg ADDED Viewed

Git LFS Details

SHA256: ae2799f75879022947f6346c97460d857671f729aa059d4c8f8fd9111bf5bc50
Pointer size: 131 Bytes
Size of remote file: 336 kB

simple_mosaic.py CHANGED Viewed

@@ -2,7 +2,8 @@
 from pathlib import Path
 from typing import List, Tuple, Iterator
 import numpy as np
-from PIL import Image
 class SimpleMosaicImage:
     def __init__(self, path: str):
@@ -22,13 +23,29 @@ class SimpleMosaicImage:
             print(f"[INFO] Resized to {new_w}x{new_h}")
         return self
     def crop_to_grid(self, grid_size: int = 32) -> "SimpleMosaicImage":
         new_w = (self.width // grid_size) * grid_size
         new_h = (self.height // grid_size) * grid_size
-        if new_w != self.width or new_h != self.height:
             self.img = self.img.crop((0, 0, new_w, new_h))
             self.width, self.height = new_w, new_h
-            print(f"[INFO] Cropped to {new_w}x{new_h} for grid {grid_size}")
         return self
     def _as_array(self):
@@ -38,7 +55,20 @@ class SimpleMosaicImage:
         for y in range(0, self.height, grid_size):
             for x in range(0, self.width, grid_size):
                 yield (x, y, grid_size, grid_size)
     @staticmethod
     def _cell_mean(arr, x, y, w, h):
         block = arr[y:y+h, x:x+w, :]
@@ -53,23 +83,99 @@ class SimpleMosaicImage:
         dist2 = np.sum(diff*diff, axis=1)
         idx = int(np.argmin(dist2))
         return tuple(int(v) for v in pal[idx])
-    def mosaic_average_color(self, grid_size: int = 32):
         arr = self._as_array()
         out = np.empty_like(arr)
-        for (x, y, w, h) in self.iter_cells(grid_size):
             color = self._cell_mean(arr, x, y, w, h)
             out[y:y+h, x:x+w, :] = color
         return Image.fromarray(out, mode="RGB")
-    def mosaic_with_palette(self, grid_size: int, palette: List[Tuple[int,int,int]]):
         arr = self._as_array()
-        out = np.empty_like(arr)
-        for (x, y, w, h) in self.iter_cells(grid_size):
-            avg = self._cell_mean(arr, x, y, w, h)
-            color = self._nearest_color(avg, palette)
-            out[y:y+h, x:x+w, :] = color
-        return Image.fromarray(out, mode="RGB")
     def save(self, image: Image.Image, out_path: str) -> None:
         Path(out_path).parent.mkdir(parents=True, exist_ok=True)
@@ -77,16 +183,27 @@ class SimpleMosaicImage:
         print(f"[INFO] Saved: {out_path}")
-PALETTE_16 = [
-    (0,0,0), (255,255,255), (255,0,0), (0,255,0), (0,0,255),
-    (255,255,0), (255,0,255), (0,255,255),
-    (128,128,128), (128,0,0), (0,128,0), (0,0,128),
-    (128,128,0), (128,0,128), (0,128,128), (200,200,200)
-]
-loader = SimpleMosaicImage("./samples/IMG_5090.jpg")
-loader.resize(longest_side=512).crop_to_grid(grid_size=2)
-mosaic = loader.mosaic_average_color(grid_size=2)
-loader.save(mosaic, "./out/mosaic_avg_32.png")

 from pathlib import Path
 from typing import List, Tuple, Iterator
 import numpy as np
+from PIL import Image, ImageDraw
+from tile_library import build_cifar10_tile_library, build_cifar100_tile_library
 class SimpleMosaicImage:
     def __init__(self, path: str):
             print(f"[INFO] Resized to {new_w}x{new_h}")
         return self
+    def quantize_colors(self, n_colors: int = 16) -> "SimpleMosaicImage":
+        """Apply color quantization using PIL's built-in algorithm"""
+        quantized = self.img.quantize(colors=n_colors, method=Image.MEDIANCUT)
+        self.img = quantized.convert('RGB')
+        print(f"[INFO] Color quantized to {n_colors} colors")
+        return self
     def crop_to_grid(self, grid_size: int = 32) -> "SimpleMosaicImage":
+        """Smart boundary handling: preserve original size when possible"""
+        # Only crop if loss is minimal (<2%), otherwise preserve original size
         new_w = (self.width // grid_size) * grid_size
         new_h = (self.height // grid_size) * grid_size
+        lost_pixels = (self.width - new_w) + (self.height - new_h)
+        total_pixels = self.width + self.height
+        loss_ratio = lost_pixels / total_pixels
+        if loss_ratio < 0.02:  # Only crop if loss < 2%
             self.img = self.img.crop((0, 0, new_w, new_h))
             self.width, self.height = new_w, new_h
+            print(f"[INFO] Cropped to {new_w}x{new_h} for grid {grid_size} (loss: {loss_ratio:.1%})")
+        else:
+            print(f"[INFO] Preserved original size {self.width}x{self.height} (would lose {loss_ratio:.1%})")
         return self
     def _as_array(self):
         for y in range(0, self.height, grid_size):
             for x in range(0, self.width, grid_size):
                 yield (x, y, grid_size, grid_size)
+    def draw_cells(self, cells, outline=(255, 0, 0), width=0.1):
+        """
+        Draw cell borders on the original image, returns a new image.
+        outline: border color
+        width: border line width
+        """
+        canvas = self.img.copy()
+        draw = ImageDraw.Draw(canvas)
+        for (x, y, w, h) in cells:
+            # PIL rectangle bottom-right is inclusive, -1 to avoid overflow
+            draw.rectangle((x, y, x + w - 1, y + h - 1), outline=outline, width=width)
+        return canvas
     @staticmethod
     def _cell_mean(arr, x, y, w, h):
         block = arr[y:y+h, x:x+w, :]
         dist2 = np.sum(diff*diff, axis=1)
         idx = int(np.argmin(dist2))
         return tuple(int(v) for v in pal[idx])
+    def build_adaptive_cells(
+        self,
+        start_size: int = 64,
+        min_size: int = 16,
+        threshold: float = 20.0,     # Use grayscale variance as complexity measure
+        ) -> list[tuple[int,int,int,int]]:
+        """
+        Returns [(x,y,w,h), ...]: Quadtree-style adaptive grid using iterative stack.
+        Requirement: Image should be resized/cropped to be divisible by start_size for better alignment.
+        """
+        arr = self._as_array()
+        # Grayscale (BT.601)
+        gray = (0.299*arr[...,0] + 0.587*arr[...,1] + 0.114*arr[...,2]).astype(np.float32)
+        cells: list[tuple[int,int,int,int]] = []
+        # First rough division by start_size, push large blocks to stack
+        stack: list[tuple[int,int,int,int]] = []
+        for yy in range(0, self.height, start_size):
+            for xx in range(0, self.width, start_size):
+                ww = min(start_size, self.width  - xx)
+                hh = min(start_size, self.height - yy)
+                stack.append((xx, yy, ww, hh))
+        # Process stack: decide whether to keep or subdivide into 4 blocks
+        while stack:
+            x, y, w, h = stack.pop()
+            # Keep if reached minimum size
+            if w <= min_size or h <= min_size:
+                cells.append((x, y, w, h))
+                continue
+            # Complexity: grayscale variance
+            region = gray[y:y+h, x:x+w]
+            score = float(region.var())
+            # Below threshold -> keep without subdivision
+            if score < threshold:
+                cells.append((x, y, w, h))
+                continue
+            # Otherwise subdivide into 4 blocks (try to halve), handle boundary remainder
+            w2 = max(min_size, w // 2)
+            h2 = max(min_size, h // 2)
+            # Fallback: keep if cannot subdivide further (avoid infinite loop)
+            if w2 == w and h2 == h:
+                cells.append((x, y, w, h))
+                continue
+            # Top-left
+            stack.append((x, y, w2, h2))
+            # Top-right
+            x2 = x + w2
+            wR = min(w - w2, self.width - x2)
+            if wR > 0:
+                stack.append((x2, y, wR, h2))
+            # Bottom-left
+            y2 = y + h2
+            hB = min(h - h2, self.height - y2)
+            if hB > 0:
+                stack.append((x, y2, w2, hB))
+            # Bottom-right
+            if wR > 0 and hB > 0:
+                stack.append((x2, y2, wR, hB))
+        return cells
+    def mosaic_average_color_adaptive(self, cells):
         arr = self._as_array()
         out = np.empty_like(arr)
+        for (x, y, w, h) in cells:
             color = self._cell_mean(arr, x, y, w, h)
             out[y:y+h, x:x+w, :] = color
         return Image.fromarray(out, mode="RGB")
+    def mosaic_with_tiles_adaptive(self, cells, tiles, tile_means: np.ndarray):
+        """
+        Adaptive grid version: pass in cells from build_adaptive_cells.
+        """
+        out_img = Image.new("RGB", (self.width, self.height))
         arr = self._as_array()
+        means = tile_means.astype(np.float32)
+        for (x, y, w, h) in cells:
+            block_mean = np.array(self._cell_mean(arr, x, y, w, h), dtype=np.float32)
+            diff = means - block_mean[None, :]
+            idx = int(np.argmin(np.sum(diff*diff, axis=1)))
+            tile = tiles[idx].resize((w, h), Image.BILINEAR)
+            out_img.paste(tile, (x, y))
+        return out_img
     def save(self, image: Image.Image, out_path: str) -> None:
         Path(out_path).parent.mkdir(parents=True, exist_ok=True)
         print(f"[INFO] Saved: {out_path}")
+loader = SimpleMosaicImage("./samples/akaza.jpg")
+loader.quantize_colors(16).crop_to_grid(2)
+cells = loader.build_adaptive_cells(
+    start_size=64,  # Initial block size
+    min_size=4,    # Minimum block size
+    threshold=5.0  # Lower value = more subdivision
+)
+tiles_10, tile_means_10, tile_labels_10 = build_cifar10_tile_library(max_per_class=1000)
+tiles_100, tile_means_100, tile_labels_100 = build_cifar100_tile_library(max_per_class=400)
+vis1 = loader.draw_cells(cells, outline=(0, 255, 0), width=1)
+vis1.save("./out/cells_outline_akaza.png")
+mosaic_adapt = loader.mosaic_average_color_adaptive(cells)
+loader.save(mosaic_adapt, "./out/mosaic_adaptive_akaza.png")
+mosaic_tiles_adapt_10 = loader.mosaic_with_tiles_adaptive(cells, tiles=tiles_10, tile_means=tile_means_10)
+loader.save(mosaic_tiles_adapt_10, "./out/mosaic_cifar_adaptive_akaza_10.png")
+mosaic_tiles_adapt_100 = loader.mosaic_with_tiles_adaptive(cells, tiles=tiles_100, tile_means=tile_means_100)
+loader.save(mosaic_tiles_adapt_100, "./out/mosaic_cifar_adaptive_akaza_100.png")

tile_library.py ADDED Viewed

	@@ -0,0 +1,64 @@

+"""
+Tile library
+"""
+import numpy as np
+from PIL import Image
+from torchvision import datasets, transforms
+def build_cifar10_tile_library(root="./cifar_data", max_per_class=500):
+    """
+    Download/load CIFAR-10 training set as tile library.
+    For speed control, defaults to max_per_class tiles per class (10 classes, total <= 10*max_per_class).
+    Returns:
+      tiles:   List[PIL.Image], original 32x32
+      means:   np.ndarray [N,3], RGB average color of each tile (0..255)
+      labels:  np.ndarray [N], class labels (0..9)
+    """
+    ds = datasets.CIFAR10(root=root, train=True, download=True,
+                          transform=transforms.ToTensor())
+    counts = {c : 0 for c in range(10)}
+    tiles, means, labels = [], [], []
+    for img_tensor, lab in ds:
+        if counts[lab] >= max_per_class:
+            continue
+        arr= (img_tensor.numpy().transpose(1,2,0) * 255).astype(np.uint8)
+        pil = Image.fromarray(arr, mode="RGB")
+        tiles.append(pil)
+        means.append(arr.reshape(-1,3).mean(axis=0))
+        labels.append(lab)
+        counts[lab]+=1
+    means = np.asarray(means, dtype=np.float32)
+    labels = np.asarray(labels, dtype=np.int64)
+    print(f"[INFO] CIFAR10 tiles: {len(tiles)} (each 32x32). Per-class cap={max_per_class}")
+    return tiles, means, labels
+def build_cifar100_tile_library(root="./cifar_data", max_per_class=500):
+    """
+    Download/load CIFAR-100 training set as tile library.
+    For speed control, defaults to max_per_class tiles per class (100 classes, total <= 100*max_per_class).
+    Returns:
+      tiles:   List[PIL.Image], original 32x32
+      means:   np.ndarray [N,3], RGB average color of each tile (0..255)
+      labels:  np.ndarray [N], class labels (0..99)
+    """
+    ds = datasets.CIFAR100(root=root, train=True, download=True,
+                          transform=transforms.ToTensor())
+    counts = {c : 0 for c in range(100)}
+    tiles, means, labels = [], [], []
+    for img_tensor, lab in ds:
+        if counts[lab] >= max_per_class:
+            continue
+        arr= (img_tensor.numpy().transpose(1,2,0) * 255).astype(np.uint8)
+        pil = Image.fromarray(arr, mode="RGB")
+        tiles.append(pil)
+        means.append(arr.reshape(-1,3).mean(axis=0))
+        labels.append(lab)
+        counts[lab]+=1
+    means = np.asarray(means, dtype=np.float32)
+    labels = np.asarray(labels, dtype=np.int64)
+    print(f"[INFO] CIFAR10 tiles: {len(tiles)} (each 32x32). Per-class cap={max_per_class}")
+    return tiles, means, labels