MeasurementTesting

Sleeping

App Files Files Community

MeasurementTesting / dxf__omar3_2.py

Marthee

Update dxf__omar3_2.py

b425674 verified over 1 year ago

raw

history blame contribute delete

23.8 kB

	# -*- coding: utf-8 -*-
	"""Version to be deployed of 3.2 Calculating area/perimeter

	Automatically generated by Colab.

	Original file is located at
	https://colab.research.google.com/drive/1XPeCoTBgWSNBYZ3aMKBteP4YG3w4bORs
	"""

	# pip install ezdxf[draw]

	# pip install --upgrade ezdxf

	# pip install pymupdf #==1.22.5

	# pip install PyPDF2

	# pip install ezdxf scipy

	"""## Imports"""

	import numpy as np
	import cv2
	from matplotlib import pyplot as plt
	import math
	from PIL import Image , ImageDraw, ImageFont , ImageColor
	import fitz
	import ezdxf as ez
	import sys
	from ezdxf import units
	from ezdxf.math import OCS, Matrix44, Vec3
	import ezdxf
	import matplotlib.pyplot as plt
	from matplotlib.patches import Polygon
	from shapely.geometry import Polygon as ShapelyPolygon
	from ezdxf.math import Vec2
	import random
	import pandas as pd
	import google_sheet_Legend
	import tsadropboxretrieval
	from ezdxf import bbox

	"""## Notes"""

	#new approach to get width and height of dxf plan
	'''
	This portion is used to convert vertices read from dxf to pixels in order to accurately locate shapes in the image and pdf
	ratio :
	MeasuredMetric* PixelValue/ DxfMetric = MeasuredPixel
	PixelValue: taken from the pixel conversion code; the second number in the bracket represents the perimeter
	DxfMetric: measured perimeter from foxit

	divide pixelvalue by dxfmetric, will give u a ratio , this is ur dxfratio


	'''


	"""PDF to image"""

	def pdftoimg(datadoc):
	    """Render the first page of a PDF as an OpenCV-style BGR image array.

	    Args:
	        datadoc: PDF content handed to ``fitz.open`` as an in-memory stream
	            (presumably ``bytes`` — confirm against the caller).

	    Returns:
	        A numpy array holding the rendered first page with its channels
	        converted from RGB to BGR.
	    """
	    doc = fitz.open('pdf', datadoc)
	    try:
	        pix = doc[0].get_pixmap()  # render page to an image
	        # Image.frombytes copies the samples, so the image remains usable
	        # after the document is closed below.
	        rendered = Image.frombytes('RGB', [pix.width, pix.height], pix.samples)
	    finally:
	        # The original never closed the document.
	        doc.close()
	    return cv2.cvtColor(np.array(rendered), cv2.COLOR_RGB2BGR)


	# ISO A-series sheet dimensions in inches, keyed by size name.
	ISO_SIZES_INCHES = {
	    "A0": (33.11, 46.81),
	    "A1": (23.39, 33.11),
	    "A2": (16.54, 23.39),
	    "A3": (11.69, 16.54),
	    "A4": (8.27, 11.69),
	    "A5": (5.83, 8.27),
	    "A6": (4.13, 5.83),
	    "A7": (2.91, 4.13),
	    "A8": (2.05, 2.91),
	    "A9": (1.46, 2.05),
	    "A10": (1.02, 1.46),
	}


	def get_paper_size_in_inches(width, height):
	    """Return the name of the first ISO size matching the given dimensions.

	    A size matches when both of its sides are within 0.1 inch of the given
	    sides, in either orientation. Entries are tried in table order and the
	    first hit wins; ``"Unknown Size"`` is returned when nothing matches.
	    """
	    tolerance = 0.1
	    for name, (side_a, side_b) in ISO_SIZES_INCHES.items():
	        same_orientation = (
	            abs(side_a - width) < tolerance and abs(side_b - height) < tolerance
	        )
	        swapped_orientation = (
	            abs(side_a - height) < tolerance and abs(side_b - width) < tolerance
	        )
	        if same_orientation or swapped_orientation:
	            return name
	    return "Unknown Size"

	def analyze_pdf(datadoc):
	    """Print every page's size and return the size of the last page.

	    Page dimensions are read from ``page.rect`` in points and divided by 72
	    to obtain inches. Each page is classified with
	    ``get_paper_size_in_inches`` and reported on stdout.

	    Args:
	        datadoc: PDF content handed to ``fitz.open`` as an in-memory stream.

	    Returns:
	        ``(width_inches, height_inches, paper_size)`` of the LAST page
	        visited (identical to the first page for single-page documents).

	    Raises:
	        ValueError: if the document has no pages. The original failed with
	            an unbound-local error at the return statement in that case.
	    """
	    pdf_document = fitz.open('pdf', datadoc)
	    try:
	        if len(pdf_document) == 0:
	            raise ValueError("PDF document contains no pages")

	        for page_number, page in enumerate(pdf_document, start=1):
	            rect = page.rect
	            # Convert points to inches
	            width_inches, height_inches = rect.width / 72, rect.height / 72
	            paper_size = get_paper_size_in_inches(width_inches, height_inches)
	            print(f"Page {page_number}: {width_inches:.2f} x {height_inches:.2f} inches ({paper_size})")
	    finally:
	        # Close the document even when a page fails to load.
	        pdf_document.close()

	    return width_inches, height_inches, paper_size


	def get_dxfSize(dxfpath):
	    """Return two numbers derived from the modelspace bounding box of a DXF.

	    The file is read with ezdxf and the overall bounding box of all
	    modelspace entities is computed. The returned pair is
	    ``(extmin.x + extmax.x, extmin.y + extmax.y)``.

	    NOTE(review): this is the SUM of the two corners, not their difference,
	    so it equals the drawing's width/height only when ``extmin`` is at the
	    origin — confirm this is intended.
	    """
	    modelspace = ezdxf.readfile(dxfpath).modelspace()
	    overall_bbox = bbox.extents(modelspace, cache=bbox.Cache())
	    print("Overall Bounding Box:", overall_bbox)

	    x_total = overall_bbox.extmin[0] + overall_bbox.extmax[0]
	    y_total = overall_bbox.extmin[1] + overall_bbox.extmax[1]
	    print(x_total, y_total)

	    return x_total, y_total



	def switch_case(argument):
	    """Look up the ratio associated with an ISO paper-size name.

	    Prints the chosen ratio and returns it. Names that are not in the table
	    (for example ``"Unknown Size"``) yield the default ratio ``1``.
	    """
	    ratio_by_paper_size = {
	        "A0": 1.27,
	        "A1": 2.54,
	        "A2": 5.08,
	        "A3": 10.16,
	        "A4": 20.32,
	        "A5": 40.64,
	        "A6": 81.28,
	        "A7": 162.56,
	        "A8": 325.12,
	        "A9": 650.24,
	        "A10": 1300.48,
	    }
	    # Fall back to 1 when the paper size is not recognised.
	    ratio = ratio_by_paper_size.get(argument, 1)
	    print("Final Ratio=", ratio)
	    return ratio




	def RetriveRatio(datadoc, dxfpath):
	    """Choose the scale ratio to apply to DXF coordinates.

	    The longer side reported by ``analyze_pdf`` (inches) is compared with
	    the larger value reported by ``get_dxfSize``. When their quotient
	    ``dxf / pdf`` lies strictly between 0.2 and 1.2, the ratio is looked up
	    from the paper size via ``switch_case``; otherwise the ratio is 1.
	    """
	    width, height, paper_size = analyze_pdf(datadoc)
	    # max() keeps its first argument on ties, like the original if/else.
	    bigger = max(height, width)

	    width_dxf, height_dxf = get_dxfSize(dxfpath)
	    bigger_dxf = max(height_dxf, width_dxf)

	    if not (0.2 < bigger_dxf / bigger < 1.2):
	        return 1

	    # NOTE(review): the label says dxf/pdf but the printed value is pdf/dxf.
	    print("bigger_dxf/bigger", bigger / bigger_dxf)
	    return switch_case(paper_size)


	"""Flips image
	DXF origin is at the bottom left while img origin is top left
	"""

	def flip(img):
	    """Rotate an image by 180 degrees about its centre, then mirror it.

	    The image is warped with a 180-degree rotation matrix built around
	    ``(width/2, height/2)`` and the result is flipped around the vertical
	    axis (``cv2.flip`` with flip code 1). The output has the same size as
	    the input.
	    """
	    rows, cols = img.shape[:2]
	    half_turn = cv2.getRotationMatrix2D((cols / 2, rows / 2), 180, 1)
	    turned = cv2.warpAffine(img, half_turn, (cols, rows))
	    return cv2.flip(turned, 1)

	"""### Hatched areas"""

	def get_hatched_areas(filename,FinalRatio):
	# Collects polygon-like shapes from the modelspace of the DXF file `filename`.
	# Handled entity types: HATCH (polyline and edge boundary paths), SOLID,
	# LWPOLYLINE, POLYLINE and SPLINE. Every coordinate is multiplied by FinalRatio.
	# A shape is kept only if its shapely area is > 1.5 and both sides of its
	# bounding box are > 0.7. Returns a list of [vertices, area, perimeter]
	# entries sorted by ascending area.
	# NOTE(review): block indentation was lost in this copy of the file, so the
	# nesting described in the comments below is inferred — confirm against the
	# original source before changing the logic.
	doc = ezdxf.readfile(filename)
	# Only the in-memory header is changed; the document is not saved in this function.
	# ($MEASUREMENT = 1 presumably selects metric units — confirm.)
	doc.header['$MEASUREMENT'] = 1
	msp = doc.modelspace()
	trial=0
	hatched_areas = []

	for entity in msp:

	if entity.dxftype() == 'HATCH':
	# flag and trial are reset for every HATCH entity.
	flag=0
	trial=0

	print(entity.dxftype())

	for path in entity.paths:
	if str(path.type)=='BoundaryPathType.POLYLINE':
	print('First type of Hatch')
	vertices = [(vertex[0]* (FinalRatio), vertex[1]* (FinalRatio))for vertex in path.vertices]
	# Paths with three or fewer vertices are ignored.
	if(len(vertices)>3):
	poly = ShapelyPolygon(vertices)

	minx, miny, maxx, maxy = poly.bounds

	# Calculate the width and height of the bounding box
	width = maxx - minx
	height = maxy - miny



	if (poly.area > 1.5 and (height > 0.7 and width > 0.7)):
	area1 = round(poly.area,3)
	perimeter = round (poly.length,3)
	# Only the first qualifying polyline path of this HATCH is appended.
	if trial==0:
	hatched_areas.append([vertices,area1,perimeter])
	trial=1
	else:
	# NOTE(review): flag is set when an equal area already exists, but it is
	# never read in this branch, so later polyline paths are never appended
	# — confirm whether that is intended.
	for i in range(len(hatched_areas)):
	if(area1 == hatched_areas[i][1]):
	flag=1
	elif str(path.type) == 'BoundaryPathType.EDGE':
	print('Second type of Hatch')

	vert=[]
	flag=0
	flag2=0
	# Builds the vertex list from the first edge's start and end, then the
	# end point of every following edge.
	# NOTE(review): assumes every edge exposes .start/.end — confirm for
	# non-line edge types.
	for edge in path.edges:
	x,y=edge.start
	x1,y1=edge.end
	if(flag==0):
	vert=[(x* (FinalRatio),y* (FinalRatio)),(x1* (FinalRatio),y1* (FinalRatio))]
	else:
	vert.append([x1* (FinalRatio),y1* (FinalRatio)])
	flag=1
	poly = ShapelyPolygon(vert)
	minx, miny, maxx, maxy = poly.bounds

	# Calculate the width and height of the bounding box
	width = maxx - minx
	height = maxy - miny

	if (poly.area > 1.5 and (height > 0.7 and width > 0.7)):
	area1= round(poly.area,3)
	perimeter = round (poly.length,3)
	# Skip the shape when an entry with exactly the same rounded area exists.
	for i in range(len(hatched_areas)):
	if(area1 == hatched_areas[i][1]):
	flag2=1
	if(flag2==0):
	hatched_areas.append([vert,area1,perimeter])
	else:
	# Any other boundary path type is only printed.
	print(path.type)

	elif entity.dxftype() == 'SOLID':
	# The four corner vertices are scaled; area and perimeter are stored
	# unrounded and no duplicate check is done for SOLID entities.
	vertices = [entity.dxf.vtx0 * (FinalRatio), entity.dxf.vtx1* (FinalRatio), entity.dxf.vtx2* (FinalRatio), entity.dxf.vtx3* (FinalRatio)]
	poly = ShapelyPolygon(vertices)
	minx, miny, maxx, maxy = poly.bounds

	# Calculate the width and height of the bounding box
	width = maxx - minx
	height = maxy - miny

	if (poly.area > 1.5 and (height > 0.7 and width > 0.7)):
	hatched_areas.append([vertices,poly.area,poly.length])

	elif entity.dxftype() == 'LWPOLYLINE':

	vertices=[]
	lwpolyline = entity
	points = lwpolyline.get_points()
	flag=0

	for i in range(len(points)):
	vertices.append([points[i][0]* (FinalRatio),points[i][1]* (FinalRatio)])
	if(len(vertices)>3):

	# NOTE(review): the polyline is accepted when the first and last vertex
	# share the same x OR the same y; a strict "closed" test would need both
	# — confirm.
	if(vertices[0][0] == vertices[len(vertices)-1][0] or vertices[0][1] == vertices[len(vertices)-1][1]):

	poly=ShapelyPolygon(vertices)
	minx, miny, maxx, maxy = poly.bounds

	# Calculate the width and height of the bounding box
	width = maxx - minx
	height = maxy - miny

	if (poly.area > 1.5 and (height > 0.7 and width > 0.7)):
	area1 = round(poly.area,3)
	perimeter = round (poly.length,3)
	# Skip the shape when an entry with exactly the same rounded area exists.
	for i in range(len(hatched_areas)):
	if(area1 == hatched_areas[i][1]):
	flag=1
	if(flag==0):
	hatched_areas.append([vertices,area1,perimeter])


	elif entity.dxftype() == 'POLYLINE':

	flag=0
	vertices = [(v.dxf.location.x * (FinalRatio), v.dxf.location.y * (FinalRatio)) for v in entity.vertices]
	print('Vertices:', vertices)

	if(len(vertices)>3):

	# Same first/last-vertex test as for LWPOLYLINE (x OR y equal).
	if(vertices[0][0] == vertices[len(vertices)-1][0] or vertices[0][1] == vertices[len(vertices)-1][1]):

	poly=ShapelyPolygon(vertices)
	minx, miny, maxx, maxy = poly.bounds

	# Calculate the width and height of the bounding box
	width = maxx - minx
	height = maxy - miny

	if (poly.area > 1.5 and (height > 0.7 and width > 0.7)):
	area1 = round(poly.area,3)
	perimeter = round (poly.length,3)
	# Skip the shape when an entry with exactly the same rounded area exists.
	for i in range(len(hatched_areas)):
	if(area1 == hatched_areas[i][1]):
	flag=1
	if(flag==0):
	hatched_areas.append([vertices,area1,perimeter])

	elif entity.dxftype() == 'SPLINE':
	spline_entity = entity
	vertices = []
	# The polygon is built from the spline's control points, not from points
	# sampled on the curve; no duplicate check is done for SPLINE entities.
	control_points = spline_entity.control_points
	if(len(control_points)>3):
	for i in range(len(control_points)):
	vertices.append([control_points[i][0]* (FinalRatio),control_points[i][1]* (FinalRatio)])
	poly=ShapelyPolygon(vertices)

	minx, miny, maxx, maxy = poly.bounds

	# Calculate the width and height of the bounding box
	width = maxx - minx
	height = maxy - miny


	if (poly.area > 1.5 and (height > 0.7 and width > 0.7)):
	area1 = round(poly.area,3)
	perimeter = round (poly.length,3)
	hatched_areas.append([vertices,area1,perimeter])

	# Sort ascending by area (second element of each entry).
	sorted_data = sorted(hatched_areas, key=lambda x: x[1])
	return sorted_data

	"""### Rotate polygon"""

	from math import sin, cos, radians

	def rotate_point(point, angle, pdfrotation, width, height, center_point=(0, 0)):
	    """Rotate ``point`` about ``center_point`` and shift it by the page size.

	    The point is rotated counter-clockwise by ``angle`` degrees around
	    ``center_point`` (the origin by default). After the rotation an offset
	    is added: ``width`` on the x axis when ``pdfrotation`` is non-zero,
	    otherwise ``height`` on the y axis.

	    Returns:
	        The transformed point as an ``(x, y)`` tuple.
	    """
	    theta = radians(angle % 360)

	    # Express the point relative to the rotation centre.
	    dx = point[0] - center_point[0]
	    dy = point[1] - center_point[1]

	    rotated_x = dx * cos(theta) - dy * sin(theta)
	    rotated_y = dx * sin(theta) + dy * cos(theta)

	    # Move back from the centre and apply the page-size offset.
	    if pdfrotation != 0:
	        return (rotated_x + width + center_point[0], rotated_y + center_point[1])
	    return (rotated_x + center_point[0], rotated_y + height + center_point[1])


	def rotate_polygon(polygon, angle, pdfrotation, width, height, center_point=(0, 0)):
	    """Apply ``rotate_point`` to every corner of a polygon.

	    ``polygon`` is an iterable of ``(x, y)`` corners. Each corner is rotated
	    counter-clockwise by ``angle`` degrees around ``center_point`` (origin by
	    default) and shifted exactly as ``rotate_point`` does.

	    Returns:
	        A list with the transformed corners, in the input order.
	    """
	    return [
	        rotate_point(corner, angle, pdfrotation, width, height, center_point)
	        for corner in polygon
	    ]

	# Create a dataframe containing: color, count (how many times this object is found in the plan), area of one of these shapes, total area,
	# perimeter, total perimeter, length, total length
	#import pandas as pd
	#SimilarAreaDictionary= pd.DataFrame(columns=['Guess','Color','Occurences','Area','Total Area','Perimeter','Total Perimeter','Length','Total Length','R','G','B'])
	# Loop over the hatched areas, count the occurrences of each shape, and build a table from these values

	def generate_color_array(length):
	    """Return ``length`` distinct random RGB colours.

	    Args:
	        length: number of colours wanted. Zero or a negative number yields
	            an empty list.

	    Returns:
	        A list of ``(r, g, b)`` tuples with components in ``0..255`` and no
	        repeated colour.

	    Raises:
	        ValueError: if more colours are requested than exist (256**3); the
	            original looped forever in that case.
	    """
	    if length > 256 ** 3:
	        raise ValueError("cannot generate more than 256**3 distinct RGB colours")

	    colorRanges = []
	    # Set membership replaces the list scan done for every candidate.
	    seen = set()
	    while len(colorRanges) < length:
	        # Generate random RGB values (drawn in r, g, b order as before)
	        candidate = (
	            random.randint(0, 255),
	            random.randint(0, 255),
	            random.randint(0, 255),
	        )
	        # Ensure no duplicate colors
	        if candidate not in seen:
	            seen.add(candidate)
	            colorRanges.append(candidate)
	    return colorRanges

	def Create_DF(dxfpath, datadoc):
	    """Build the legend table that groups similar shapes of a DXF plan.

	    The scale ratio is obtained with ``RetriveRatio`` and the shapes with
	    ``get_hatched_areas``. Shapes whose area AND perimeter are both within
	    ``tol`` (2) of an existing row are counted as another occurrence of that
	    row; otherwise a new row with its own colour is appended.

	    Args:
	        dxfpath: path of the DXF file.
	        datadoc: PDF content passed on to ``RetriveRatio``.

	    Returns:
	        A pandas DataFrame with the columns 'Guess', 'Color', 'Occurences',
	        'Area', 'Total Area', 'Perimeter', 'Total Perimeter', 'Length',
	        'Total Length', 'Texts' and 'Comments'. Only the area, perimeter,
	        occurrence, colour and comment columns are filled here.
	    """
	    FinalRatio = RetriveRatio(datadoc, dxfpath)
	    hatched_areas = get_hatched_areas(dxfpath, FinalRatio)

	    SimilarAreaDictionary = pd.DataFrame(columns=['Guess','Color','Occurences','Area','Total Area','Perimeter','Total Perimeter','Length','Total Length','Texts','Comments'])

	    # Fixed palette used for the first shapes.
	    colorRanges = [
	        [255, 0, 0], [0, 0, 255], [0, 255, 255], [0, 64, 0], [255, 204, 0],
	        [255, 128, 64], [255, 0, 128], [255, 128, 192], [128, 128, 255], [128, 64, 0],
	        [0, 255, 0], [0, 200, 0], [255, 128, 255], [128, 0, 255], [0, 128, 192],
	        [128, 0, 128], [128, 0, 0], [0, 128, 255], [149, 1, 70], [255, 182, 128],
	        [222, 48, 71], [240, 0, 112], [255, 0, 255], [192, 46, 65], [0, 0, 128],
	        [0, 128, 64], [255, 255, 0], [128, 0, 80], [255, 255, 128], [90, 255, 140],
	        [255, 200, 20], [91, 16, 51], [90, 105, 138], [114, 10, 138], [36, 82, 78],
	        [225, 105, 190], [108, 150, 170], [11, 35, 75], [42, 176, 170], [255, 176, 170],
	        [209, 151, 15], [81, 27, 85], [226, 106, 122], [67, 119, 149], [159, 179, 140],
	        [159, 179, 30], [255, 85, 198], [255, 27, 85], [188, 158, 8], [140, 188, 120],
	        [59, 61, 52], [65, 81, 21], [212, 255, 174], [15, 164, 90], [41, 217, 245],
	        [213, 23, 182], [11, 85, 169], [78, 153, 239], [0, 66, 141], [64, 98, 232],
	        [140, 112, 255], [57, 33, 154], [194, 117, 252], [116, 92, 135], [74, 43, 98],
	        [188, 13, 123], [129, 58, 91], [255, 128, 100], [171, 122, 145], [255, 98, 98],
	        [222, 48, 77],
	    ]
	    # Random fallback colours, indexed by the same shape index once the fixed
	    # palette runs out. At least 300 are generated as before; more are
	    # generated when the plan has more shapes, because the original raised
	    # IndexError on shape number 301.
	    colorRanges2 = generate_color_array(max(300, len(hatched_areas)))

	    tol = 2
	    for i, shape in enumerate(hatched_areas):
	        area = shape[1]
	        perimeter = shape[2]
	        color = colorRanges[i] if i < len(colorRanges) else colorRanges2[i]

	        condition1 = (SimilarAreaDictionary['Area'] >= area - tol) & (SimilarAreaDictionary['Area'] <= area + tol)
	        condition2 = (SimilarAreaDictionary['Perimeter'] >= perimeter - tol) & (SimilarAreaDictionary['Perimeter'] <= perimeter + tol)
	        combined_condition = condition1 & condition2

	        if any(combined_condition):
	            # Add the shape to the first row it is similar to.
	            index = np.where(combined_condition)[0][0]
	            SimilarAreaDictionary.at[index, 'Occurences'] += 1
	            SimilarAreaDictionary.at[index, 'Total Area'] = SimilarAreaDictionary.at[index, 'Total Area'] + area
	            SimilarAreaDictionary.at[index, 'Total Perimeter'] = SimilarAreaDictionary.at[index, 'Total Perimeter'] + perimeter
	        else:
	            # First shape of its kind: the totals start at its own values.
	            new_data = {'Area': area, 'Total Area': area, 'Perimeter': perimeter, 'Total Perimeter': perimeter, 'Occurences': 1, 'Color': color, 'Comments': ''}
	            SimilarAreaDictionary = pd.concat([SimilarAreaDictionary, pd.DataFrame([new_data])], ignore_index=True)

	    return SimilarAreaDictionary
	"""### Draw on Image and PDF"""

	def mainFunctionDrawImgPdf(datadoc, dxfpath, dxfratio, pdfpath, pdfname):
	    """Draw the DXF shapes on the rendered page and annotate the PDF.

	    For every shape returned by ``get_hatched_areas`` the function fills the
	    contour on the flipped page image and adds two polygon annotations to
	    the first PDF page (one carrying the area, one the perimeter), coloured
	    according to the legend built by ``Create_DF``. The legend is then sent
	    to ``google_sheet_Legend.legendGoogleSheets`` and all annotations of the
	    document are collected into a DataFrame.

	    Args:
	        datadoc: PDF content handed to ``fitz.open`` as an in-memory stream.
	        dxfpath: path of the DXF file.
	        dxfratio: factor applied to the scaled DXF coordinates to obtain
	            image/PDF coordinates.
	        pdfpath: forwarded to ``legendGoogleSheets``.
	        pdfname: forwarded to ``legendGoogleSheets``.

	    Returns:
	        ``(doc, image_new1, SimilarAreaDictionary, spreadsheetId,
	        spreadsheet_url, namepathArr, list1, hatched_areas)``. ``doc`` is
	        returned open and holds the new annotations.

	    NOTE(review): block nesting was reconstructed from a copy of the file
	    that had lost its indentation — compare with the original before merging.
	    """
	    FinalRatio = RetriveRatio(datadoc, dxfpath)
	    hatched_areas = get_hatched_areas(dxfpath, FinalRatio)
	    img = pdftoimg(datadoc)
	    imgg = flip(img)

	    doc = fitz.open('pdf', datadoc)
	    page2 = doc[0]
	    rotationOld = page2.rotation
	    derotationMatrix = page2.derotation_matrix
	    width = abs(page2.mediabox[2]) + abs(page2.mediabox[0])
	    height = abs(page2.mediabox[3]) + abs(page2.mediabox[1])
	    print('mediabox', width, height)

	    # The original also rendered a pixmap here to compute a `ratio` value
	    # that was never used; that dead work is removed.
	    if page2.rotation != 0:
	        rotationangle = page2.rotation
	        # Annotate in the unrotated frame; the rotation is restored below.
	        page2.set_rotation(0)
	    else:
	        rotationangle = 270

	    NewColors = []
	    SimilarAreaDictionary = Create_DF(dxfpath, datadoc)
	    tol = 2
	    i = 0

	    # Iterate through each polygon in metric units
	    for polygon in hatched_areas:
	        cntPoints = []
	        cntPoints1 = []
	        shapee = []
	        # Convert each vertex from metric to pixel coordinates
	        for vertex in polygon[0]:
	            x = (vertex[0]) * dxfratio
	            y = (vertex[1]) * dxfratio
	            if rotationangle == 0:
	                if y < 0:
	                    y = y * -1
	            cntPoints.append([int(x), int(y)])
	            cntPoints1.append([x, y])

	        for poi in np.array(cntPoints1):
	            x1, y1 = poi
	            p1 = fitz.Point(x1, y1)
	            p1 = p1 * derotationMatrix
	            shapee.append([p1[0], p1[1]])

	        # Swap the x/y columns before rotating into PDF space.
	        shapee = np.flip(shapee, 1)
	        shapee = rotate_polygon(shapee, rotationangle, rotationOld, width, height)

	        # Find the legend row this polygon was grouped into.
	        condition1 = (SimilarAreaDictionary['Area'] >= polygon[1] - tol) & (SimilarAreaDictionary['Area'] <= polygon[1] + tol)
	        condition2 = (SimilarAreaDictionary['Perimeter'] >= polygon[2] - tol) & (SimilarAreaDictionary['Perimeter'] <= polygon[2] + tol)
	        combined_condition = condition1 & condition2

	        if any(combined_condition):
	            index = np.where(combined_condition)[0][0]
	            NewColors = SimilarAreaDictionary.at[index, 'Color']
	        else:
	            NewColors = SimilarAreaDictionary.at[i, 'Color']

	        # OpenCV expects BGR, the legend stores RGB.
	        cv2.drawContours(imgg, [np.array(cntPoints)], -1, ([NewColors[2], NewColors[1], NewColors[0]]), thickness=-1)

	        # PDF colours are floats in 0..1.
	        pdf_color = (int(NewColors[0]) / 255, int(NewColors[1]) / 255, int(NewColors[2]) / 255)

	        annot11 = page2.add_polygon_annot(points=shapee)  # 'Polygon'
	        annot11.set_border(width=0.2)
	        annot11.set_colors(stroke=pdf_color, fill=pdf_color)
	        annot11.set_info(content='Area=' + str(polygon[1]) + ' m^2', subject='ADR Team')
	        annot11.set_opacity(0.9)
	        annot11.update()

	        annot12 = page2.add_polygon_annot(points=shapee)  # 'Polygon'
	        annot12.set_border(width=0.2)
	        annot12.set_colors(stroke=pdf_color)
	        annot12.set_info(content='Perimeter=' + str(polygon[2]) + ' m', subject='ADR Team')
	        annot12.set_opacity(0.8)
	        annot12.update()
	        i += 1

	    alpha = 0.8  # Transparency factor.

	    page2.set_rotation(rotationOld)
	    Correct_img = flip(imgg)

	    image_new1 = cv2.addWeighted(Correct_img, alpha, img, 1 - alpha, 0)
	    SimilarAreaDictionary = SimilarAreaDictionary.fillna(' ')
	    gc, spreadsheet_service, spreadsheetId, spreadsheet_url, namepathArr = google_sheet_Legend.legendGoogleSheets(SimilarAreaDictionary, pdfname, pdfpath)

	    list1 = pd.DataFrame(columns=['content', 'id', 'subject', 'color'])

	    for page in doc:
	        # Iterate through annotations on the page
	        for annot in page.annots():
	            # annot.colors is a dictionary with 'stroke' and 'fill' keys
	            annot_color = annot.colors
	            if annot_color is None:
	                continue
	            stroke_color = annot_color.get('stroke')  # Border color
	            fill_color = annot_color.get('fill')  # Fill color
	            if fill_color:
	                print('fill')
	            # Stroke wins over fill, as before. Annotations with neither are
	            # skipped (as deletemarkupsDXF does); the original hit an unbound
	            # or stale `v` in that case.
	            chosen = stroke_color if stroke_color else fill_color
	            if not chosen:
	                continue
	            # The scraped source had lost two '*' operators on this line.
	            x, y, z = int(chosen[0] * 255), int(chosen[1] * 255), int(chosen[2] * 255)
	            list1.loc[len(list1)] = [annot.info['content'], annot.info['id'], annot.info['subject'], [x, y, z]]

	    return doc, image_new1, SimilarAreaDictionary, spreadsheetId, spreadsheet_url, namepathArr, list1, hatched_areas


	def deletemarkupsDXF(list1, dbPath, path):
	    """Return the markups that differ between the original and current PDF.

	    Args:
	        list1: string representation of the original markup table (the
	            'content', 'id', 'subject', 'color' data), turned back into a
	            DataFrame here.
	        dbPath: Dropbox folder; concatenated with ``path`` for the download.
	        path: file name/path appended to ``dbPath``.

	    Returns:
	        DataFrame of rows present in only one of the two markup tables
	        (original vs. annotations found in the downloaded PDF), excluding
	        rows whose content starts with 'Scale'. Empty when nothing differs.
	    """
	    # SECURITY NOTE(review): eval() executes arbitrary code. If `list1` can
	    # come from an untrusted client, replace this with ast.literal_eval or
	    # JSON — left unchanged here because the exact input format is not
	    # visible from this file.
	    myDict1 = eval(list1)
	    list1 = pd.DataFrame(myDict1)

	    dbxTeam = tsadropboxretrieval.ADR_Access_DropboxTeam('user')
	    md, res = dbxTeam.files_download(path=dbPath + path)
	    data = res.content

	    # Prepare a DataFrame for the annotations in the new PDF
	    list2 = pd.DataFrame(columns=['content', 'id', 'subject', 'color'])

	    doc = fitz.open("pdf", data)
	    try:
	        for page in doc:
	            # Iterate through annotations on the page
	            for annot in page.annots():
	                annot_color = annot.colors
	                if annot_color is None:
	                    continue
	                # Prefer the stroke colour, fall back to the fill colour.
	                color = annot_color.get('stroke') or annot_color.get('fill')
	                if color:
	                    # Convert to a 0..255 RGB tuple (tuples are hashable)
	                    color_tuple = (int(color[0] * 255), int(color[1] * 255), int(color[2] * 255))
	                    list2.loc[len(list2)] = [annot.info['content'], annot.info['id'], annot.info['subject'], color_tuple]
	    finally:
	        # The original never closed the downloaded document.
	        doc.close()

	    # Ensure that colors are stored as tuples (which are hashable)
	    list1['color'] = list1['color'].apply(lambda x: tuple(x) if isinstance(x, list) else x)

	    # Rows that appear in only one of the two tables are the changed markups
	    deletedrows = pd.concat([list1, list2]).drop_duplicates(keep=False)

	    print(deletedrows, len(deletedrows))
	    if len(deletedrows) != 0:
	        deletedrows = deletedrows[['content', 'id', 'subject', 'color']]
	        # Drop rows where 'content' starts with 'Scale'. A boolean mask is
	        # used instead of drop-by-label: after concat both tables keep their
	        # own 0..n labels, so dropping a label could also remove an unrelated
	        # row that shares it. na=False treats missing content as "no match".
	        starts_with_scale = deletedrows['content'].str.startswith('Scale', na=False)
	        deletedrows = deletedrows[~starts_with_scale]

	    return deletedrows