Spaces:

kshdes37
/

cadspace

Runtime error

App Files Files Community

cadspace / CADFusion /src /test /f1_eval.py

kshdes37

Upload 50 files

91daf98 verified 3 months ago

raw

history blame contribute delete

3.34 kB

	import json
	import re
	import argparse

	"""
	We did not implement the Hungarian matching algorithm from Text2CAD; instead we provide a vanilla, count-based matching for F1. This is because:
	1. We argue that CAD scenarios are too complicated to be evaluated with a simple matching algorithm, especially when performed at the primitive level. Moreover, matching every primitive exactly is against the goal of our framework, which attempts to encourage CAD models to generate visually correct objects rather than primitives that exactly match the ground truth.
	2. In our exploration, a discrepancy in the number of primitives between the model's generation and the ground truth usually indicates that the entire sketch has failed, so the choice of matching algorithm does not affect the final evaluation result anyway.
	3. Our evaluation is a lower bound on the performance the model would obtain under the matching algorithm; therefore it does not affect the overall integrity of our framework.

	We encourage users to implement their own matching algorithm if they want to evaluate the model with a stricter metric.
	"""

	# Command-line interface: the reference (ground-truth) set and the generated
	# set that will be scored against it.
	parser = argparse.ArgumentParser(description='Evaluate F1 scores for generated sketches.')
	parser.add_argument('--test-path', type=str, default='data/sl_data/test.jsonl', help='Path to the JSON or JSONL file containing test data')
	parser.add_argument('--file_path', type=str, required=True, help='Path to the JSON or JSONL file containing generated sketches.')
	args = parser.parse_args()
	file_path = args.file_path
	data_path = args.test_path

	# The default file name advertises JSONL, but a multi-record JSONL file is
	# not a single JSON document and cannot be read in one parse. Try the whole
	# file as one document first (the original behavior), then fall back to
	# parsing one record per non-blank line.
	with open(data_path, 'r', encoding='utf-8') as f:
	    raw_text = f.read()
	try:
	    data = json.loads(raw_text)
	except json.JSONDecodeError:
	    data = [json.loads(row) for row in raw_text.splitlines() if row.strip()]

	def find_f1(ground_truth, pred, token):
	    """Return a count-based F1 score for one token pattern.

	    The number of non-overlapping regex matches of ``token`` is counted in
	    ``ground_truth`` and in ``pred``; the smaller count is treated as the
	    number of matched occurrences. Recall is that number over the
	    ground-truth count, precision is that number over the predicted count.

	    Args:
	        ground_truth: Reference sequence text.
	        pred: Generated sequence text.
	        token: Regular-expression pattern identifying one occurrence.

	    Returns:
	        The harmonic mean of precision and recall, or ``-1`` when the
	        pattern does not occur in at least one of the two strings.
	    """
	    gt_count = sum(1 for _ in re.finditer(token, ground_truth))
	    pred_count = sum(1 for _ in re.finditer(token, pred))
	    matched = min(gt_count, pred_count)
	    # Sentinel for "nothing to compare"; it also keeps both divisions below
	    # away from a zero denominator.
	    if matched <= 0:
	        return -1
	    recall = matched / gt_count
	    precision = matched / pred_count
	    return 2 * recall * precision / (recall + precision)

	# Load the generated sketches. Accept either a single JSON document (the
	# original behavior) or one JSON record per line, since the CLI help refers
	# to the file as JSONL.
	with open(file_path, 'r', encoding='utf-8') as f:
	    gen_text = f.read()
	try:
	    gen = json.loads(gen_text)
	except json.JSONDecodeError:
	    gen = [json.loads(row) for row in gen_text.splitlines() if row.strip()]


	def _mean_or_nan(scores):
	    """Return the arithmetic mean of ``scores``, or NaN when it is empty."""
	    return sum(scores) / len(scores) if scores else float('nan')


	# Evaluation budget used by the original script: only the first 1000 aligned
	# samples are scored.
	MAX_SAMPLES = 1000

	# Per-sample scores, one list per primitive type plus one for extrusions.
	line = []
	arc = []
	circle = []
	ext = []

	# zip() stops at the shorter input, so a file holding fewer than MAX_SAMPLES
	# records no longer raises IndexError.
	for gt_sample, pred_sample in zip(data[:MAX_SAMPLES], gen[:MAX_SAMPLES]):
	    ground_truth = gt_sample['output']
	    pred = pred_sample['output']

	    # Extrusion-level F1 over the whole sequence; the -1 sentinel is skipped.
	    ext_f1 = find_f1(ground_truth, pred, r'<extrude_end>')
	    if ext_f1 > 0:
	        ext.append(ext_f1)

	    # Split into sketch-extrude segments; the text after the last
	    # '<extrude_end>' is dropped.
	    skext_gt = ground_truth.split('<extrude_end>')[:-1]
	    skext_pred = pred.split('<extrude_end>')[:-1]
	    min_len_skext = min(len(skext_gt), len(skext_pred))
	    if min_len_skext == 0:
	        continue

	    line_f1 = 0
	    arc_f1 = 0
	    circle_f1 = 0
	    # Segments are paired by position; surplus segments on either side are
	    # ignored by zip().
	    # NOTE(review): find_f1 returns -1 when a primitive type is absent from
	    # either segment, and that sentinel is summed as-is here, which lowers
	    # the per-sample mean. Kept unchanged so reported numbers stay
	    # comparable — confirm this is intended.
	    for gt, pr in zip(skext_gt, skext_pred):
	        line_f1 += find_f1(gt, pr, r'line.*?<curve_end>')
	        arc_f1 += find_f1(gt, pr, r'arc.*?<curve_end>')
	        circle_f1 += find_f1(gt, pr, r'circle.*?<curve_end>')

	    line_f1 = line_f1 / min_len_skext
	    arc_f1 = arc_f1 / min_len_skext
	    circle_f1 = circle_f1 / min_len_skext
	    # Only strictly positive per-sample means contribute to the final average.
	    if line_f1 > 0:
	        line.append(line_f1)
	    if arc_f1 > 0:
	        arc.append(arc_f1)
	    if circle_f1 > 0:
	        circle.append(circle_f1)

	# A primitive type that never scored above zero yields NaN instead of a
	# ZeroDivisionError; the NaN propagates into the combined average.
	line_avg = _mean_or_nan(line)
	arc_avg = _mean_or_nan(arc)
	circle_avg = _mean_or_nan(circle)
	avgf1 = (line_avg + arc_avg + circle_avg) / 3
	print(file_path, line_avg, arc_avg, circle_avg, avgf1, _mean_or_nan(ext))