Spaces:

VashuTheGreat2
/

ML-Learner

Running

App Files Files Community

ML-Learner / python_backend /refactor_problems.py

VashuTheGreat2

Upload folder using huggingface_hub

c01955c verified about 1 month ago

raw

history blame contribute delete

3.08 kB


	import json
	import ast
	import re

	def clean_and_refactor(code, function_name):
	# 1. First, UNWRAP anything that was double-wrapped or already wrapped
	# Remove any existing "class Solution:" lines and unindent
	lines = code.split('\n')
	unindented_lines = []
	for line in lines:
	if line.strip() == "class Solution:":
	continue
	# Remove one level of indentation (4 spaces) if it was wrapped
	if line.startswith(" "):
	unindented_lines.append(line[4:])
	else:
	unindented_lines.append(line)

	code = "\n".join(unindented_lines)

	# Remove redundant (self, self, ...)
	code = code.replace("(self, self, ", "(self, ")
	code = code.replace("(self, self)", "(self)")

	# 2. Apply the intended refactors (idempotent)
	code = code.replace("from tinygrad.tensor import Tensor", "import numpy as np")
	code = code.replace("tinygrad.tensor import Tensor", "numpy as np")

	# Replace Tensor( ... ) calls with np.array( ... ) - only if not torch.
	code = code.replace("Tensor(-1)", "-1")
	code = re.sub(r'(?<!torch\.)\bTensor\s*\(', 'np.array(', code)

	# Replace Tensor type hints with np.ndarray
	code = re.sub(r'[:]\s*(?<!torch\.)\bTensor\b', ': np.ndarray', code)
	code = re.sub(r'->\s*(?<!torch\.)\bTensor\b', '-> np.ndarray', code)

	# Catch-all for standalone Tensor
	code = re.sub(r'(?<!torch\.)\bTensor\b', 'np.ndarray', code)

	# 3. Re-wrap correctly
	lines = code.split('\n')
	imports = []
	body = []
	for line in lines:
	if line.strip().startswith(("import ", "from ")):
	imports.append(line)
	else: body.append(line)

	final_body = []
	found_func = False
	for line in body:
	if line.strip().startswith("def "):
	# Ensure only ONE self is present
	if "(self, " not in line and "(self)" not in line:
	line = re.sub(r'def\s+(\w+)\s*\(', r'def \1(self, ', line)
	line = line.replace("self, )", "self)")
	found_func = True
	final_body.append(" " + line if (line.strip() or found_func) else line)

	return "\n".join(imports) + "\n\n" + "class Solution:\n" + "\n".join(final_body)

	def main():
	with open("problems.json", "r") as f:
	problems = json.load(f)

	for p in problems:
	func_name = p.get("function_name", "unknown")
	if func_name == "unknown":
	match = re.search(r"def (\w+)\s*\(", p["starter_code"])
	if match: func_name = match.group(1)
	p["function_name"] = func_name

	p["starter_code"] = clean_and_refactor(p["starter_code"], func_name)
	p["solution_code"] = clean_and_refactor(p["solution_code"], func_name)

	# Test cases are likely already fine (lists), but let's double check they aren't double-nested
	# Actually they looked okay in the previous view.

	with open("problems.json", "w") as f:
	json.dump(problems, f, indent=2)

	if __name__ == "__main__":
	main()