Spaces:

AGLO-AI
/

raster2seq

Runtime error

raster2seq / data_preprocess /cubicasa5k /floorplan_extraction.py

anas

Initial deployment of Raster2Seq floor plan vectorization API

fadb92b about 2 months ago

16.5 kB

	import argparse
	import glob
	import json
	import os
	import sys
	from multiprocessing import Pool
	from pathlib import Path

	import cv2
	import numpy as np
	from shapely.geometry import Polygon
	from tqdm import tqdm

	sys.path.append(str(Path(__file__).resolve().parent.parent))
	from common_utils import resort_corners
	from create_coco_cc5k import create_coco_bounding_box

	from util.plot_utils import plot_semantic_rich_floorplan_opencv


	def plot_floor(output_coco_polygons, categories_dict, img_w, img_h, save_path, door_window_index=None):
	    """Render a semantic floorplan visualisation through the OpenCV plotter.

	    Args:
	        output_coco_polygons: Iterable of ``(polygon, category_id)`` pairs. Each
	            polygon is anything ``np.array(...).reshape(-1, 2)`` accepts, e.g. a
	            flat ``[x0, y0, x1, y1, ...]`` list.
	        categories_dict: Sequence of category records with ``"id"`` and
	            ``"name"`` keys; turned into an id -> name mapping for the plotter.
	        img_w: Image width forwarded to the plotter.
	        img_h: Image height forwarded to the plotter.
	        save_path: Output path forwarded to the plotter.
	        door_window_index: Category ids forwarded to the plotter as the
	            door/window classes. ``None`` (the default) means ``[10, 9]``.
	    """
	    if door_window_index is None:
	        # Built per call so the default list is never shared between calls.
	        door_window_index = [10, 9]

	    # Corner coordinates are cast to int32 before being handed to the plotter.
	    gt_sem_rich = [
	        [np.array(poly).reshape(-1, 2).astype(np.int32), poly_type]
	        for poly, poly_type in output_coco_polygons
	    ]

	    plot_semantic_rich_floorplan_opencv(
	        gt_sem_rich,
	        save_path,
	        img_w=img_w,
	        img_h=img_h,
	        door_window_index=door_window_index,
	        semantics_label_mapping=get_dataset_class_labels(categories_dict),
	        is_bw=False,
	    )


	def prepare_dict(categories_dict):
	    """Return an empty COCO-style container that reuses ``categories_dict``.

	    The ``"images"`` and ``"annotations"`` lists are fresh on every call; the
	    ``"categories"`` entry is the very object that was passed in (no copy).
	    """
	    return {
	        "images": [],
	        "annotations": [],
	        "categories": categories_dict,
	    }


	def extract_polygons_from_mask(binary_mask, output_mask_path):
	    """Extract the outer contours of a mask as polygons and save a debug image.

	    Every non-zero pixel of ``binary_mask`` is treated as foreground. Only
	    external contours are returned (``cv2.RETR_EXTERNAL``), each simplified
	    with ``cv2.approxPolyDP`` using a tolerance of 0.1% of its perimeter.

	    Args:
	        binary_mask (numpy.ndarray): Single-channel mask of shape (H, W);
	            values > 0 mark polygon regions, 0 marks background.
	        output_mask_path (str): Where the visualisation (mask with the
	            polygon outlines drawn on top) is written with ``cv2.imwrite``.

	    Returns:
	        list: One entry per contour, each a list of ``[x, y]`` vertices. A
	        contour that simplifies to a single vertex is still returned as a
	        one-element list ``[[x, y]]``.
	    """
	    # Ensure the mask is binary (0 and 1)
	    binary_mask = (binary_mask > 0).astype(np.uint8)

	    # Find contours in the binary mask
	    contours, _ = cv2.findContours(binary_mask, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)

	    polygons = []
	    for contour in contours:
	        # Approximate the contour to reduce the number of points
	        epsilon = 0.001 * cv2.arcLength(contour, True)  # Adjust epsilon for more/less detail
	        approx_polygon = cv2.approxPolyDP(contour, epsilon, True)
	        # approxPolyDP yields shape (N, 1, 2). reshape keeps the result 2-D
	        # even when N == 1, where squeeze() would collapse it to a flat
	        # [x, y] and break every consumer expecting a list of points.
	        polygons.append(approx_polygon.reshape(-1, 2).tolist())

	    # Convert binary_mask to a 3-channel image to draw colored polylines
	    binary_mask_colored = cv2.cvtColor(binary_mask * 255, cv2.COLOR_GRAY2BGR)

	    # Outline the polygons on the mask; (0, 0, 255) is red in OpenCV's BGR order
	    for polygon in polygons:
	        points = np.array(polygon, dtype=np.int32)
	        cv2.polylines(binary_mask_colored, [points], isClosed=True, color=(0, 0, 255), thickness=10)

	    cv2.imwrite(output_mask_path, binary_mask_colored)

	    return polygons


	def read_polygons_from_json(json_file):
	    """Load polygons, raw annotations and categories from an annotation file.

	    Args:
	        json_file: Path to a JSON file with ``"categories"`` and
	            ``"annotations"`` entries; each annotation needs ``"segmentation"``
	            and ``"category_id"``.

	    Returns:
	        tuple: ``(source_polygons, source_misc, category_dict)`` where
	        ``source_polygons`` is a list of ``(first segmentation ring, category_id)``
	        tuples, ``source_misc`` is the list of annotation records in file order,
	        and ``category_dict`` is the file's ``"categories"`` value.
	    """
	    with open(json_file, "r") as handle:
	        coco = json.load(handle)

	    category_dict = coco["categories"]
	    annotations = coco["annotations"]

	    # Only the first ring of each segmentation is used.
	    first_rings = [record["segmentation"][0] for record in annotations]
	    category_ids = [record["category_id"] for record in annotations]
	    source_misc = list(annotations)
	    source_polygons = list(zip(first_rings, category_ids))

	    return source_polygons, source_misc, category_dict


	def get_dataset_class_labels(category_dict):
	    """Build an ``id -> name`` lookup from a sequence of category records."""
	    labels = {}
	    for category in category_dict:
	        labels[category["id"]] = category["name"]
	    return labels


	def check_all_window_door_inside(polygons, door_window_index):
	    """Tell whether every ``(polygon, category_id)`` pair is a door or window.

	    Returns ``True`` when each category id is contained in
	    ``door_window_index`` -- which includes the case of an empty ``polygons``.
	    """
	    for _, poly_type in polygons:
	        if poly_type not in door_window_index:
	            return False
	    return True


	def extract_region_and_annotation(
	    source_image,
	    source_annot_path,
	    region_polygons,
	    start_image_id,
	    output_image_dir="output",
	    output_annot_dir="annotations",
	    output_aux_dir="output_aux",
	    vis_aux=True,
	):
	    """Split one annotated floorplan image into per-region crops with annotations.

	    For every region polygon the image is cropped to the polygon's bounding
	    box (grown by a 10 px margin and clipped to the image), and every source
	    annotation whose polygon lies completely inside that box is re-expressed
	    in crop coordinates. Regions whose collected annotations are all
	    doors/windows (category ids 10 and 9) -- including regions with no
	    annotation at all -- are skipped and produce no files.

	    Args:
	        source_image (numpy.ndarray): The source image, indexed as (H, W, ...).
	        source_annot_path (str): Path to the source image's annotation JSON;
	            its base name (zero-padded to 5 characters) is used in output names.
	        region_polygons (list): One polygon per region, each a list of
	            ``[x, y]`` points in source-image coordinates.
	        start_image_id (int): Image id assigned to the first kept region;
	            subsequent kept regions get consecutive ids.
	        output_image_dir (str): Directory receiving the cropped images.
	        output_annot_dir (str): Directory receiving one JSON file per crop.
	        output_aux_dir (str): Directory receiving the visualisations.
	        vis_aux (bool): Whether to write visualisations of the source
	            floorplan and of every kept crop.

	    Returns:
	        int: The next unused image id, i.e. ``start_image_id`` plus the number
	        of regions that were kept.
	    """
	    door_window_index = [10, 9]
	    source_polygons, source_misc, categories_dict = read_polygons_from_json(source_annot_path)
	    source_img_id = os.path.basename(source_annot_path).split(".")[0].zfill(5)
	    src_h, src_w = source_image.shape[:2]

	    if vis_aux:
	        gt_sem_rich_path = os.path.join(output_aux_dir, "{}_org_floor.png".format(source_img_id))
	        plot_floor(
	            source_polygons,
	            categories_dict,
	            src_w,
	            src_h,
	            gt_sem_rich_path,
	            door_window_index=door_window_index,
	        )

	    # The source polygons do not depend on the region, so convert them once.
	    source_polygons_np = [np.array(src_poly).reshape(-1, 2) for src_poly, _ in source_polygons]

	    margin = 10
	    img_id = start_image_id

	    # each region polygon corresponds to an image
	    for polygon in region_polygons:
	        points = np.array(polygon, dtype=np.int32)

	        # Bounding box of the region, expanded by the margin and clipped to the image
	        x, y, w, h = cv2.boundingRect(points)
	        x_expanded = max(x - margin, 0)
	        y_expanded = max(y - margin, 0)
	        w_expanded = min(x + w + margin, src_w) - x_expanded
	        h_expanded = min(y + h + margin, src_h) - y_expanded
	        x, y, w, h = x_expanded, y_expanded, w_expanded, h_expanded

	        bounding_box = np.array([x, y, x + w, y + h])

	        instance_id = 0
	        output_coco_polygons = []
	        coco_annotation_dict_list = []
	        # Iterate through the polygons and keep those fully inside the bounding box
	        for j, src_corners in enumerate(source_polygons_np):
	            poly_bbox = np.hstack([np.min(src_corners, axis=0), np.max(src_corners, axis=0)])
	            if np.any(poly_bbox[:2] < bounding_box[:2]) or np.any(poly_bbox[2:] > bounding_box[2:]):
	                continue

	            # Express the polygon relative to the top-left corner of the crop
	            scaled_polygon = src_corners - bounding_box[:2]

	            coco_seg_poly = []
	            for p in resort_corners(scaled_polygon):
	                coco_seg_poly += list(p)

	            category_id = source_polygons[j][1]
	            if len(scaled_polygon) == 2:
	                # Two-point polygons cannot form a shapely Polygon, so the
	                # source area/bbox are reused. The bbox is copied before being
	                # shifted: the same source annotation may fall inside several
	                # regions and must not accumulate offsets. Shifting by the
	                # plain ints x/y (not NumPy scalars) keeps it JSON-serialisable.
	                area = source_misc[j]["area"]
	                coco_bb = list(source_misc[j]["bbox"])
	                coco_bb[0] -= x
	                coco_bb[1] -= y
	            else:
	                poly_shapely = Polygon(scaled_polygon)
	                area = poly_shapely.area
	                rectangle_shapely = poly_shapely.envelope

	                # Slightly wider bounding box
	                bb_x, bb_y = rectangle_shapely.exterior.xy
	                coco_bb = create_coco_bounding_box(bb_x, bb_y, w, h, bound_pad=2)

	            coco_annotation_dict_list.append(
	                {
	                    "segmentation": [coco_seg_poly],
	                    "area": area,
	                    "iscrowd": 0,
	                    "image_id": img_id,
	                    "bbox": coco_bb,
	                    "category_id": category_id,
	                    "id": instance_id,
	                }
	            )
	            output_coco_polygons.append([coco_seg_poly, category_id])
	            instance_id += 1

	        # skip if just windows and doors are inside
	        if check_all_window_door_inside(output_coco_polygons, door_window_index):
	            continue

	        # Files are only written for kept regions, so a skipped region leaves
	        # no orphan crop behind under an id that is never recorded.
	        file_stem = f"{str(img_id).zfill(5)}_{source_img_id}"
	        cropped_roi = source_image[y : y + h, x : x + w]
	        cv2.imwrite(f"{output_image_dir}/{file_stem}.png", cropped_roi)

	        save_dict = prepare_dict(categories_dict)
	        save_dict["images"].append(
	            {
	                "file_name": f"{file_stem}.png",
	                "id": img_id,
	                "width": w,
	                "height": h,
	            }
	        )
	        save_dict["annotations"] += coco_annotation_dict_list

	        if vis_aux:
	            gt_sem_rich_path = os.path.join(
	                output_aux_dir, "{}_{}_floor.png".format(str(img_id).zfill(5), source_img_id)
	            )
	            plot_floor(
	                output_coco_polygons, categories_dict, w, h, gt_sem_rich_path, door_window_index=door_window_index
	            )

	        # Save annotations to a JSON file
	        json_path = f"{output_annot_dir}/{file_stem}.json"
	        with open(json_path, "w") as f:
	            json.dump(save_dict, f)

	        img_id += 1

	    return img_id


	def config():
	    """Parse the command-line options of this script.

	    Returns:
	        argparse.Namespace: ``data_root`` (input dataset folder) and ``output``
	        (destination folder), both strings.
	    """
	    parser = argparse.ArgumentParser(
	        description="Split CubiCasa5k COCO-format floorplans into per-region images and annotations"
	    )
	    # NOTE(review): the default value is kept unchanged for backward
	    # compatibility even though it names a different dataset.
	    parser.add_argument(
	        "--data_root",
	        default="Structured3D_panorama",
	        type=str,
	        help="path to the input dataset folder (expects <split>/*.png, "
	        "annotations_json/<split>/*.json and <split>_aux/*_mask.png)",
	    )
	    parser.add_argument("--output", default="coco_cubicasa5k", type=str, help="path to output folder")

	    return parser.parse_args()


	# Image ids reserved per source image: source image number ``k`` of a split
	# starts numbering its crops at ``start_image_id + k * _IDS_PER_SOURCE_IMAGE``.
	# NOTE(review): a source image that yields more kept regions than this would
	# reuse ids of the next source image -- confirm the data never exceeds it.
	_IDS_PER_SOURCE_IMAGE = 10


	def _process_source_image(task):
	    """Extract all region crops of one source image (runs in a worker process).

	    ``task`` is a self-contained tuple
	    ``(image_path, annot_path, mask_path, first_image_id, save_path,
	    save_anno_path, save_aux_path)`` so the worker does not rely on globals
	    inherited from the parent process and works with any multiprocessing
	    start method.

	    Returns the next unused image id reported by
	    ``extract_region_and_annotation``.
	    """
	    image_path, annot_path, mask_path, first_image_id, save_path, save_anno_path, save_aux_path = task
	    cur_image_id = int(os.path.basename(image_path).split(".")[0])

	    # cv2.imread signals an unreadable file by returning None.
	    mask_image = cv2.imread(mask_path)
	    if mask_image is None:
	        raise FileNotFoundError(f"Could not read mask image: {mask_path}")
	    source_image = cv2.imread(image_path, cv2.IMREAD_COLOR)
	    if source_image is None:
	        raise FileNotFoundError(f"Could not read source image: {image_path}")

	    # The last channel of the loaded mask image is used as the binary mask.
	    binary_mask = mask_image[:, :, -1]

	    # Extract polygons
	    region_polygons = extract_polygons_from_mask(
	        binary_mask, output_mask_path=f"{save_aux_path}/{str(cur_image_id).zfill(5)}_polylines.png"
	    )

	    return extract_region_and_annotation(
	        source_image,
	        annot_path,
	        region_polygons,
	        first_image_id,
	        save_path,
	        save_anno_path,
	        save_aux_path,
	        vis_aux=True,
	    )


	if __name__ == "__main__":
	    args = config()

	    ### prepare
	    out_folder = args.output
	    splits = ["train", "val", "test"]
	    annotation_out_folder = os.path.join(out_folder, "annotations_json")
	    save_folders = [os.path.join(out_folder, split) for split in splits]
	    annos_folders = [os.path.join(annotation_out_folder, split) for split in splits]
	    for folder in save_folders + annos_folders:
	        os.makedirs(folder, exist_ok=True)

	    ### begin processing
	    start_image_id = 3500
	    num_processes = 16

	    for split, save_path, save_anno_path in zip(splits, save_folders, annos_folders):
	        save_aux_path = save_path.rstrip("/") + "_aux"
	        os.makedirs(save_aux_path, exist_ok=True)

	        image_files = sorted(glob.glob(f"{args.data_root}/{split}/*.png"))
	        tasks = []
	        for index, image_path in enumerate(image_files):
	            id_ = os.path.basename(image_path).split(".")[0]
	            tasks.append(
	                (
	                    image_path,
	                    f"{args.data_root}/annotations_json/{split}/{id_}.json",
	                    f"{args.data_root}/{split}_aux/{id_}_mask.png",
	                    start_image_id + index * _IDS_PER_SOURCE_IMAGE,
	                    save_path,
	                    save_anno_path,
	                    save_aux_path,
	                )
	            )

	        with Pool(num_processes) as p:
	            # list(...) drains the lazy imap iterator so every task runs and
	            # worker exceptions surface here.
	            list(tqdm(p.imap(_process_source_image, tasks), total=len(tasks)))

	        # The next split starts after the id range reserved for this one.
	        start_image_id += len(tasks) * _IDS_PER_SOURCE_IMAGE