Spaces:

SohomToom
/

ComicFileToCleanedZip

Sleeping

App Files Files Community

ComicFileToCleanedZip / app.py

SohomToom

Upload 2 files

31dacfa verified 10 months ago

raw

history blame

5.12 kB

	import os
	import shutil
	import tempfile
	import cv2
	import numpy as np
	import gradio as gr
	import zipfile
	import patoolib
	import threading
	from paddleocr import PaddleOCR
	from PIL import Image

	def delayed_cleanup(path, delay=30):
	def cleanup():
	import time
	time.sleep(delay)
	try:
	if os.path.isdir(path):
	shutil.rmtree(path)
	elif os.path.exists(path):
	os.remove(path)
	except Exception as e:
	print(f"Cleanup failed: {e}")
	threading.Thread(target=cleanup).start()

	ocr = PaddleOCR(use_angle_cls=True, lang='en', det_model_dir='models/det', rec_model_dir='models/rec', cls_model_dir='models/cls')

	def classify_background_color(avg_color, white_thresh=230, black_thresh=50, yellow_thresh=100):
	r, g, b = avg_color
	if r >= white_thresh and g >= white_thresh and b >= white_thresh:
	return (255, 255, 255)
	if r <= black_thresh and g <= black_thresh and b <= black_thresh:
	return (0, 0, 0)
	if r >= yellow_thresh and g >= yellow_thresh and b < yellow_thresh:
	return (255, 255, 0)
	return None

	def sample_border_color(image, box, padding=2):
	h, w = image.shape[:2]
	x_min, y_min, x_max, y_max = box
	x_min = max(0, x_min - padding)
	x_max = min(w-1, x_max + padding)
	y_min = max(0, y_min - padding)
	y_max = min(h-1, y_max + padding)

	top = image[y_min:y_min+padding, x_min:x_max]
	bottom = image[y_max-padding:y_max, x_min:x_max]
	left = image[y_min:y_max, x_min:x_min+padding]
	right = image[y_min:y_max, x_max-padding:x_max]

	border_pixels = np.vstack((top.reshape(-1, 3), bottom.reshape(-1, 3),
	left.reshape(-1, 3), right.reshape(-1, 3)))
	if border_pixels.size == 0:
	return (255, 255, 255)
	median_color = np.median(border_pixels, axis=0)
	return tuple(map(int, median_color))

	def detect_text_boxes(image):
	results = ocr.ocr(image, cls=True)
	if not results or not results[0]:
	return []
	boxes = []
	for line in results[0]:
	box, (text, confidence) = line
	if text.strip():
	x_min = int(min(pt[0] for pt in box))
	x_max = int(max(pt[0] for pt in box))
	y_min = int(min(pt[1] for pt in box))
	y_max = int(max(pt[1] for pt in box))
	boxes.append(((x_min, y_min, x_max, y_max), text, confidence))
	return boxes

	def remove_text_dynamic_fill(img_path, output_path):
	image = cv2.imread(img_path)
	if image is None:
	return
	if len(image.shape) == 2 or image.shape[2] == 1:
	image = cv2.cvtColor(image, cv2.COLOR_GRAY2RGB)
	else:
	image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)

	boxes = detect_text_boxes(image)

	for (bbox, text, confidence) in boxes:
	if confidence < 0.4 or not text.strip():
	continue
	x_min, y_min, x_max, y_max = bbox
	height = y_max - y_min
	padding = 2 if height <= 30 else 4 if height <= 60 else 6
	x_min_p = max(0, x_min - padding)
	y_min_p = max(0, y_min - padding)
	x_max_p = min(image.shape[1]-1, x_max + padding)
	y_max_p = min(image.shape[0]-1, y_max + padding)
	sample_crop = image[y_min_p:y_max_p, x_min_p:x_max_p]
	avg_color = np.mean(sample_crop.reshape(-1, 3), axis=0)
	fill_color = classify_background_color(avg_color)
	if fill_color is None:
	fill_color = sample_border_color(image, (x_min, y_min, x_max, y_max))
	cv2.rectangle(image, (x_min_p, y_min_p), (x_max_p, y_max_p), fill_color, -1)

	image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
	cv2.imwrite(output_path, image)

	def extract_comic_archive(archive_path, extract_to):
	if archive_path.endswith(".cbz"):
	with zipfile.ZipFile(archive_path, 'r') as zip_ref:
	zip_ref.extractall(extract_to)
	elif archive_path.endswith(".cbr"):
	patoolib.extract_archive(archive_path, outdir=extract_to)

	def process_cbz_cbr(file):
	temp_input = tempfile.mkdtemp()
	temp_output = tempfile.mkdtemp()
	extract_comic_archive(file.name, temp_input)
	for root, _, files in os.walk(temp_input):
	for fname in files:
	if fname.lower().endswith((".jpg", ".jpeg", ".png")):
	src = os.path.join(root, fname)
	dst = os.path.join(temp_output, fname)
	remove_text_dynamic_fill(src, dst)
	zip_path = shutil.make_archive(temp_output, 'zip', temp_output)
	delayed_cleanup(temp_input)
	delayed_cleanup(temp_output)
	delayed_cleanup(zip_path)
	return zip_path

	demo = gr.Interface(
	fn=process_cbz_cbr,
	inputs=gr.File(file_types=[".cbz", ".cbr"], label="Upload Comic Archive (.cbz or .cbr)"),
	outputs=gr.File(label="Download Cleaned Zip"),
	title="Comic Text Cleaner (.cbz/.cbr)",
	description="Upload a .cbz or .cbr file and get a zip of cleaned comic images (text removed using PaddleOCR)."
	)

	demo.launch()