|
|
import warnings |
|
|
import cv2 |
|
|
import numpy as np |
|
|
from PIL import Image |
|
|
from custom_controlnet_aux.util import HWC3, resize_image_with_pad |
|
|
|
|
|
class BinaryDetector: |
|
|
def __call__(self, input_image=None, bin_threshold=0, detect_resolution=512, output_type=None, upscale_method="INTER_CUBIC", **kwargs): |
|
|
if "img" in kwargs: |
|
|
warnings.warn("img is deprecated, please use `input_image=...` instead.", DeprecationWarning) |
|
|
input_image = kwargs.pop("img") |
|
|
|
|
|
if input_image is None: |
|
|
raise ValueError("input_image must be defined.") |
|
|
|
|
|
if not isinstance(input_image, np.ndarray): |
|
|
input_image = np.array(input_image, dtype=np.uint8) |
|
|
output_type = output_type or "pil" |
|
|
else: |
|
|
output_type = output_type or "np" |
|
|
|
|
|
detected_map, remove_pad = resize_image_with_pad(input_image, detect_resolution, upscale_method) |
|
|
|
|
|
img_gray = cv2.cvtColor(detected_map, cv2.COLOR_RGB2GRAY) |
|
|
if bin_threshold == 0 or bin_threshold == 255: |
|
|
|
|
|
otsu_threshold, img_bin = cv2.threshold(img_gray, 0, 255, cv2.THRESH_BINARY_INV + cv2.THRESH_OTSU) |
|
|
print("Otsu threshold:", otsu_threshold) |
|
|
else: |
|
|
_, img_bin = cv2.threshold(img_gray, bin_threshold, 255, cv2.THRESH_BINARY_INV) |
|
|
|
|
|
detected_map = cv2.cvtColor(img_bin, cv2.COLOR_GRAY2RGB) |
|
|
detected_map = HWC3(remove_pad(255 - detected_map)) |
|
|
|
|
|
if output_type == "pil": |
|
|
detected_map = Image.fromarray(detected_map) |
|
|
|
|
|
return detected_map |
|
|
|