# -*- coding: utf-8 -*-wj """Version to be deployed of 3.2 Calculating area/perimeter Automatically generated by Colab. Original file is located at https://colab.research.google.com/drive/1XPeCoTBgWSNBYZ3aMKBteP4YG3w4bORs """ # pip install ezdxf[draw] # pip install --upgrade ezdxf # pip install pymupdf #==1.22.5 # pip install PyPDF2 # pip install ezdxf scipy """## Imports""" import numpy as np import cv2 from matplotlib import pyplot as plt import math from PIL import Image , ImageDraw, ImageFont , ImageColor import fitz import ezdxf as ez import sys from ezdxf import units from ezdxf.math import OCS, Matrix44, Vec3 import ezdxf import matplotlib.pyplot as plt from matplotlib.patches import Polygon from shapely.geometry import Polygon as ShapelyPolygon from ezdxf.math import Vec2 import random import pandas as pd import google_sheet_Legend import tsadropboxretrieval from ezdxf import bbox """## Notes""" #new approach to get width and height of dxf plan ''' This portion is used to convert vertices read from dxf to pixels in order to accurately locate shapes in the image and pdf ratio : MeasuredMetric* PixelValue/ DxfMetric = MeasuredPixel PixelValue: get from pixel conversion code , second number in the bracker represents the perimeter DxfMetric: measured perimeter from foxit divide pixelvalue by dxfmetric, will give u a ratio , this is ur dxfratio ''' """PDF to image""" def pdftoimg(datadoc): doc = fitz.open('pdf',datadoc) page=doc[0] pix = page.get_pixmap() # render page to an image pl=Image.frombytes('RGB', [pix.width,pix.height],pix.samples) img=np.array(pl) img = cv2.cvtColor(img, cv2.COLOR_RGB2BGR) return img # Standard ISO paper sizes in inches ISO_SIZES_INCHES = { "A0": (33.11, 46.81), "A1": (23.39, 33.11), "A2": (16.54, 23.39), "A3": (11.69, 16.54), "A4": (8.27, 11.69), "A5": (5.83, 8.27), "A6": (4.13, 5.83), "A7": (2.91, 4.13), "A8": (2.05, 2.91), "A9": (1.46, 2.05), "A10": (1.02, 1.46) } def get_paper_size_in_inches(width, height): """Find the closest matching paper size in inches.""" for size, (w, h) in ISO_SIZES_INCHES.items(): if (abs(w - width) < 0.1 and abs(h - height) < 0.1) or (abs(w - height) < 0.1 and abs(h - width) < 0.1): return size return "Unknown Size" def analyze_pdf(datadoc): # Open the PDF file pdf_document = fitz.open('pdf',datadoc) # Iterate through pages and print their sizes for page_number in range(len(pdf_document)): page = pdf_document[page_number] rect = page.rect width_points, height_points = rect.width, rect.height # Convert points to inches width_inches, height_inches = width_points / 72, height_points / 72 paper_size = get_paper_size_in_inches(width_inches, height_inches) print(f"Page {page_number + 1}: {width_inches:.2f} x {height_inches:.2f} inches ({paper_size})") pdf_document.close() return width_inches , height_inches , paper_size def get_dxfSize(dxfpath): doc = ezdxf.readfile(dxfpath) msp = doc.modelspace() # Create a cache for bounding box calculations # Get the overall bounding box for all entities in the modelspace cache = bbox.Cache() overall_bbox = bbox.extents(msp, cache=cache) print("Overall Bounding Box:", overall_bbox) print(overall_bbox.extmin[0]+overall_bbox.extmax[0], overall_bbox.extmin[1]+overall_bbox.extmax[1]) return overall_bbox.extmin[0]+overall_bbox.extmax[0], overall_bbox.extmin[1]+overall_bbox.extmax[1] def switch_case(argument): switcher = { "A0": 1.27, "A1": 2.54, "A2": 5.08, "A3": 10.16, "A4": 20.32, "A5": 40.64, "A6": 81.28, "A7": 162.56, "A8": 325.12, "A9": 650.24, "A10": 1300.48 } # Get the value from the dictionary; if not found, return a default value print("Final Ratio=",switcher.get(argument, 1)) return switcher.get(argument, 1) def RetriveRatio(datadoc,dxfpath): width,height,paper_size = analyze_pdf (datadoc) if(width > height ): bigger=width else: bigger=height width_dxf,height_dxf = get_dxfSize(dxfpath) if(width_dxf > height_dxf ): bigger_dxf=width_dxf else: bigger_dxf=height_dxf if(0.2 < bigger_dxf/bigger < 1.2): print("bigger_dxf/bigger",bigger/bigger_dxf) argument = paper_size FinalRatio=switch_case(argument) else: FinalRatio=1 return FinalRatio """Flips image DXF origin is at the bottom left while img origin is top left """ def flip(img): height, width = img.shape[:2] # Define the rotation angle (clockwise) angle = 180 # Calculate the rotation matrix rotation_matrix = cv2.getRotationMatrix2D((width/2, height/2), angle, 1) # Rotate the image rotated_image = cv2.warpAffine(img, rotation_matrix, (width, height)) flipped_horizontal = cv2.flip(rotated_image, 1) return flipped_horizontal """### Hatched areas""" def get_hatched_areas(filename,FinalRatio): doc = ezdxf.readfile(filename) doc.header['$MEASUREMENT'] = 1 msp = doc.modelspace() trial=0 hatched_areas = [] for entity in msp: if entity.dxftype() == 'HATCH': flag=0 trial=0 print(entity.dxftype()) for path in entity.paths: if str(path.type)=='BoundaryPathType.POLYLINE': print('First type of Hatch') vertices = [(vertex[0]* (FinalRatio), vertex[1]* (FinalRatio))for vertex in path.vertices] if(len(vertices)>3): poly = ShapelyPolygon(vertices) minx, miny, maxx, maxy = poly.bounds # Calculate the width and height of the bounding box width = maxx - minx height = maxy - miny if (poly.area > 1.5 and (height > 0.7 and width > 0.7)): area1 = round(poly.area,3) perimeter = round (poly.length,3) if trial==0: hatched_areas.append([vertices,area1,perimeter]) trial=1 else: for i in range(len(hatched_areas)): if(area1 == hatched_areas[i][1]): flag=1 elif str(path.type) == 'BoundaryPathType.EDGE': print('Second type of Hatch') vert=[] flag=0 flag2=0 for edge in path.edges: x,y=edge.start x1,y1=edge.end if(flag==0): vert=[(x* (FinalRatio),y* (FinalRatio)),(x1* (FinalRatio),y1* (FinalRatio))] else: vert.append([x1* (FinalRatio),y1* (FinalRatio)]) flag=1 poly = ShapelyPolygon(vert) minx, miny, maxx, maxy = poly.bounds # Calculate the width and height of the bounding box width = maxx - minx height = maxy - miny if (poly.area > 1.5 and (height > 0.7 and width > 0.7)): area1= round(poly.area,3) perimeter = round (poly.length,3) for i in range(len(hatched_areas)): if(area1 == hatched_areas[i][1]): flag2=1 if(flag2==0): hatched_areas.append([vert,area1,perimeter]) else: print(path.type) elif entity.dxftype() == 'SOLID': vertices = [entity.dxf.vtx0 * (FinalRatio), entity.dxf.vtx1* (FinalRatio), entity.dxf.vtx2* (FinalRatio), entity.dxf.vtx3* (FinalRatio)] poly = ShapelyPolygon(vertices) minx, miny, maxx, maxy = poly.bounds # Calculate the width and height of the bounding box width = maxx - minx height = maxy - miny if (poly.area > 1.5 and (height > 0.7 and width > 0.7)): hatched_areas.append([vertices,poly.area,poly.length]) elif entity.dxftype() == 'LWPOLYLINE': vertices=[] lwpolyline = entity points = lwpolyline.get_points() flag=0 for i in range(len(points)): vertices.append([points[i][0]* (FinalRatio),points[i][1]* (FinalRatio)]) if(len(vertices)>3): if(vertices[0][0] == vertices[len(vertices)-1][0] or vertices[0][1] == vertices[len(vertices)-1][1]): poly=ShapelyPolygon(vertices) minx, miny, maxx, maxy = poly.bounds # Calculate the width and height of the bounding box width = maxx - minx height = maxy - miny if (poly.area > 1.5 and (height > 0.7 and width > 0.7)): area1 = round(poly.area,3) perimeter = round (poly.length,3) for i in range(len(hatched_areas)): if(area1 == hatched_areas[i][1]): flag=1 if(flag==0): hatched_areas.append([vertices,area1,perimeter]) elif entity.dxftype() == 'POLYLINE': flag=0 vertices = [(v.dxf.location.x * (FinalRatio), v.dxf.location.y * (FinalRatio)) for v in entity.vertices] print('Vertices:', vertices) if(len(vertices)>3): if(vertices[0][0] == vertices[len(vertices)-1][0] or vertices[0][1] == vertices[len(vertices)-1][1]): poly=ShapelyPolygon(vertices) minx, miny, maxx, maxy = poly.bounds # Calculate the width and height of the bounding box width = maxx - minx height = maxy - miny if (poly.area > 1.5 and (height > 0.7 and width > 0.7)): area1 = round(poly.area,3) perimeter = round (poly.length,3) for i in range(len(hatched_areas)): if(area1 == hatched_areas[i][1]): flag=1 if(flag==0): hatched_areas.append([vertices,area1,perimeter]) elif entity.dxftype() == 'SPLINE': spline_entity = entity vertices = [] control_points = spline_entity.control_points if(len(control_points)>3): for i in range(len(control_points)): vertices.append([control_points[i][0]* (FinalRatio),control_points[i][1]* (FinalRatio)]) poly=ShapelyPolygon(vertices) minx, miny, maxx, maxy = poly.bounds # Calculate the width and height of the bounding box width = maxx - minx height = maxy - miny if (poly.area > 1.5 and (height > 0.7 and width > 0.7)): area1 = round(poly.area,3) perimeter = round (poly.length,3) hatched_areas.append([vertices,area1,perimeter]) sorted_data = sorted(hatched_areas, key=lambda x: x[1]) return sorted_data """### Rotate polygon""" from math import sin, cos, radians def rotate_point(point, angle,pdfrotation,width,height, center_point=(0, 0)): """Rotates a point around center_point(origin by default) Angle is in degrees. Rotation is counter-clockwise """ angle_rad = radians(angle % 360) # Shift the point so that center_point becomes the origin new_point = (point[0] - center_point[0], point[1] - center_point[1]) new_point = (new_point[0] * cos(angle_rad) - new_point[1] * sin(angle_rad), new_point[0] * sin(angle_rad) + new_point[1] * cos(angle_rad)) # Reverse the shifting we have done if pdfrotation!=0: new_point = (new_point[0]+width + center_point[0], new_point[1] + center_point[1]) #pdfsize[2] is the same as +width else: new_point = (new_point[0] + center_point[0], new_point[1]+ height + center_point[1]) # pdfsize[3] is the same as +height # new_point = (new_point[0] + center_point[0], new_point[1] + center_point[1]) return new_point def rotate_polygon(polygon, angle, pdfrotation,width,height,center_point=(0, 0)): """Rotates the given polygon which consists of corners represented as (x,y) around center_point (origin by default) Rotation is counter-clockwise Angle is in degrees """ rotated_polygon = [] for corner in polygon: rotated_corner = rotate_point(corner, angle,pdfrotation,width,height, center_point) rotated_polygon.append(rotated_corner) return rotated_polygon #create a dataframe containing color , count(how many times is this object found in the plan), area of 1 of these shapes, total area #perimeter, totat perimeter, length, total length #import pandas as pd #SimilarAreaDictionary= pd.DataFrame(columns=['Guess','Color','Occurences','Area','Total Area','Perimeter','Total Perimeter','Length','Total Length','R','G','B']) #loop 3la hatched areas and count the occurences of each shape w create a table bl hagat di def generate_color_array(length): colorRanges = [] while len(colorRanges) < length: # Generate random RGB values r = random.randint(0, 255) g = random.randint(0, 255) b = random.randint(0, 255) # Ensure no duplicate colors if (r, g, b) not in colorRanges: colorRanges.append((r, g, b)) return colorRanges def Create_DF(dxfpath,datadoc): FinalRatio= RetriveRatio(datadoc,dxfpath) hatched_areas = get_hatched_areas(dxfpath,FinalRatio) # SimilarAreaDictionary= pd.DataFrame(columns=['Area', 'Total Area', 'Perimeter', 'Total Perimeter', 'Occurences', 'Color']) SimilarAreaDictionary= pd.DataFrame(columns=['Guess','Color','Occurences','Area','Total Area','Perimeter','Total Perimeter','Length','Total Length','Texts','Comments']) colorRanges2=generate_color_array(300) colorRanges = [[255, 0, 0], [0, 0, 255], [0, 255, 255], [0, 64, 0], [255, 204, 0], [255, 128, 64], [255, 0, 128], [255, 128, 192], [128, 128, 255], [128, 64, 0],[0, 255, 0],[0, 200, 0],[255, 128, 255], [128, 0, 255], [0, 128, 192], [128, 0, 128],[128, 0, 0], [0, 128, 255], [149, 1, 70], [255, 182, 128], [222, 48, 71], [240, 0, 112], [255, 0, 255], [192, 46, 65], [0, 0, 128],[0, 128, 64],[255, 255, 0], [128, 0, 80], [255, 255, 128], [90, 255, 140],[255, 200, 20],[91, 16, 51], [90, 105, 138], [114, 10, 138], [36, 82, 78], [225, 105, 190], [108, 150, 170], [11, 35, 75], [42, 176, 170], [255, 176, 170], [209, 151, 15],[81, 27, 85], [226, 106, 122], [67, 119, 149], [159, 179, 140], [159, 179, 30],[255, 85, 198], [255, 27, 85], [188, 158, 8],[140, 188, 120], [59, 61, 52], [65, 81, 21], [212, 255, 174], [15, 164, 90],[41, 217, 245], [213, 23, 182], [11, 85, 169], [78, 153, 239], [0, 66, 141],[64, 98, 232], [140, 112, 255], [57, 33, 154], [194, 117, 252], [116, 92, 135], [74, 43, 98], [188, 13, 123], [129, 58, 91], [255, 128, 100], [171, 122, 145], [255, 98, 98], [222, 48, 77]] colorUsed=[] TotalArea=0 TotalPerimeter=0 for i in range(len(hatched_areas)): area = hatched_areas[i][1] # area perimeter = hatched_areas[i][2] # perimeter if(i < len(colorRanges)): color = colorRanges[i] colorUsed.append(color) else: color = colorRanges2[i] colorUsed.append(color) TotalArea = area TotalPerimeter = perimeter tol=2 condition1 = (SimilarAreaDictionary['Area'] >= area - tol) & (SimilarAreaDictionary['Area'] <= area +tol) condition2 = (SimilarAreaDictionary['Perimeter'] >= perimeter -tol) & (SimilarAreaDictionary['Perimeter'] <= perimeter +tol) combined_condition = condition1 & condition2 if any(combined_condition): index = np.where(combined_condition)[0][0] SimilarAreaDictionary.at[index, 'Occurences'] += 1 SimilarAreaDictionary.at[index, 'Total Area'] = SimilarAreaDictionary.at[index, 'Total Area'] + area SimilarAreaDictionary.at[index, 'Total Perimeter'] = SimilarAreaDictionary.at[index, 'Total Perimeter'] + perimeter else: TotalArea=area TotalPerimeter=perimeter new_data = {'Area': area, 'Total Area': TotalArea ,'Perimeter': perimeter, 'Total Perimeter': TotalPerimeter, 'Occurences': 1, 'Color':color,'Comments':''} #add color here and read color to insert in SimilarAreaDictionary = pd.concat([SimilarAreaDictionary, pd.DataFrame([new_data])], ignore_index=True) # print(SimilarAreaDictionary) return SimilarAreaDictionary """### Draw on Image and PDF""" def mainFunctionDrawImgPdf(datadoc,dxfpath, dxfratio,pdfpath,pdfname): FinalRatio= RetriveRatio(datadoc,dxfpath) hatched_areas = get_hatched_areas(dxfpath,FinalRatio) img=pdftoimg(datadoc) flipped_horizontal=flip(img) allcnts = [] imgg = flipped_horizontal # imgtransparent1=imgg.copy() doc = fitz.open('pdf',datadoc) page2 = doc[0] rotationOld=page2.rotation derotationMatrix=page2.derotation_matrix pix=page2.get_pixmap() width=abs(page2.mediabox[2])+abs(page2.mediabox[0]) height=abs(page2.mediabox[3])+abs(page2.mediabox[1]) print('mediabox', width , height) if page2.rotation!=0: rotationangle = page2.rotation page2.set_rotation(0) ratio = pix.width/ img.shape[0] else: ratio = pix.width/ img.shape[1] rotationangle = 270 allshapes=[] # Iterate through each polygon in metric units NewColors = [] SimilarAreaDictionary=Create_DF(dxfpath,datadoc) i=0 for polygon in hatched_areas: cntPoints = [] cntPoints1 = [] shapee = [] # Convert each vertex from metric to pixel coordinates for vertex in polygon[0]: x = (vertex[0]) *dxfratio y = (vertex[1]) *dxfratio if rotationangle==0: if y<0: y=y*-1 cntPoints.append([int(x), int(y)]) cntPoints1.append([x, y]) for poi in np.array(cntPoints1): x1, y1 = poi p1 = fitz.Point(x1,y1) # p1 = fitz.Point(x1,y1) p1=p1*derotationMatrix shapee.append([p1[0],p1[1]]) shapee=np.flip(shapee,1) shapee=rotate_polygon(shapee,rotationangle,rotationOld,width,height) tol=2 condition1 = (SimilarAreaDictionary['Area'] >= polygon[1] - tol) & (SimilarAreaDictionary['Area'] <= polygon[1] +tol) condition2 = (SimilarAreaDictionary['Perimeter'] >= polygon[2] -tol) & (SimilarAreaDictionary['Perimeter'] <= polygon[2] +tol) combined_condition = condition1 & condition2 if any(combined_condition): index = np.where(combined_condition)[0][0] # print(SimilarAreaDictionary.at[index, 'Color']) NewColors=SimilarAreaDictionary.at[index, 'Color'] else: NewColors=SimilarAreaDictionary.at[i, 'Color'] # cv2.drawContours(imgg, [np.array(cntPoints)], -1, (NewColors), thickness=2) cv2.drawContours(imgg, [np.array(cntPoints)], -1, ([NewColors[2],NewColors[1],NewColors[0]]), thickness=-1) annot11 = page2.add_polygon_annot( points=shapee) # 'Polygon' annot11.set_border(width=0.2) annot11.set_colors(stroke=(int(NewColors[0])/255,int(NewColors[1])/255,int(NewColors[2])/255), fill= (int(NewColors[0])/255,int(NewColors[1])/255,int(NewColors[2])/255) ) annot11.set_info(content='Area='+str(polygon[1])+' m^2',subject='ADR Team') annot11.set_opacity(0.9) # annot.set_line_ends(fitz.PDF_ANNOT_LE_DIAMOND, fitz.PDF_ANNOT_LE_CIRCLE) annot11.update() annot12 = page2.add_polygon_annot( points=shapee) # 'Polygon' annot12.set_border(width=0.2) annot12.set_colors(stroke=(int(NewColors[0])/255,int(NewColors[1])/255,int(NewColors[2])/255)) annot12.set_info(content='Perimeter='+str(polygon[2])+' m',subject='ADR Team') annot12.set_opacity(0.8) # annot.set_line_ends(fitz.PDF_ANNOT_LE_DIAMOND, fitz.PDF_ANNOT_LE_CIRCLE) annot12.update() i += 1 alpha = 0.8 # Transparency factor. page2.set_rotation(rotationOld) Correct_img=flip(imgg) image_new1 = cv2.addWeighted(Correct_img, alpha, img, 1 - alpha, 0) SimilarAreaDictionary = SimilarAreaDictionary.fillna(' ') gc,spreadsheet_service,spreadsheetId, spreadsheet_url , namepathArr=google_sheet_Legend.legendGoogleSheets(SimilarAreaDictionary , pdfname,pdfpath) # dbxTeam=tsadropboxretrieval.ADR_Access_DropboxTeam('user') # md, res =dbxTeam.files_download(path= pdfpath+pdfname) # data = res.content # doc=fitz.open("pdf", data) # list1=pd.DataFrame(columns=['content', 'creationDate', 'id', 'modDate', 'name', 'subject', 'title']) list1=pd.DataFrame(columns=['content', 'id', 'subject','color']) for page in doc: # Iterate through annotations on the page for annot in page.annots(): # Get the color of the annotation annot_color = annot.colors if annot_color is not None: # annot_color is a dictionary with 'stroke' and 'fill' keys stroke_color = annot_color.get('stroke') # Border color fill_color = annot_color.get('fill') # Fill color if fill_color: v='fill' print('fill') if stroke_color: v='stroke' x,y,z=int(annot_color.get(v)[0]*255),int(annot_color.get(v)[1]*255),int(annot_color.get(v)[2]*255) list1.loc[len(list1)] =[annot.info['content'],annot.info['id'],annot.info['subject'],[x,y,z]] return doc,image_new1, SimilarAreaDictionary ,spreadsheetId, spreadsheet_url , namepathArr , list1,hatched_areas def deletemarkupsDXF(list1, dbPath, path): '''list1 : original markup pdf list2 : deleted markup pdf deletedrows : deleted markups - difference between both dfs ''' myDict1 = eval(list1) list1 = pd.DataFrame(myDict1) dbxTeam = tsadropboxretrieval.ADR_Access_DropboxTeam('user') md, res = dbxTeam.files_download(path=dbPath + path) data = res.content doc = fitz.open("pdf", data) # Prepare a DataFrame for the annotations in the new PDF list2 = pd.DataFrame(columns=['content', 'id', 'subject', 'color']) for page in doc: # Iterate through annotations on the page for annot in page.annots(): # Get the color of the annotation annot_color = annot.colors if annot_color is not None: # Check for fill or stroke color stroke_color = annot_color.get('stroke') fill_color = annot_color.get('fill') v = 'stroke' if stroke_color else 'fill' color = annot_color.get(v) if color: # Convert color to tuple and multiply by 255 to get RGB values color_tuple = (int(color[0] * 255), int(color[1] * 255), int(color[2] * 255)) # Append annotation data to list2 list2.loc[len(list2)] = [annot.info['content'], annot.info['id'], annot.info['subject'], color_tuple] # Ensure that colors are stored as tuples (which are hashable) list1['color'] = list1['color'].apply(lambda x: tuple(x) if isinstance(x, list) else x) # Find the deleted rows by checking the difference between original and current annotations deletedrows = pd.concat([list1, list2]).drop_duplicates(keep=False) print(deletedrows, len(deletedrows)) flag = 0 if len(deletedrows) != 0: flag = 1 deletedrows = deletedrows[['content', 'id', 'subject', 'color']] # Drop rows where 'content' starts with 'Scale' deletedrows = deletedrows.drop(deletedrows.index[deletedrows['content'].str.startswith('Scale')]) else: flag = 0 return deletedrows