import re

# Bracketed ``[** ... **]`` spans (marked as PHI by the original comment).
# DOTALL lets ``.`` cross line breaks so a placeholder that wraps onto the
# next line is still removed; the non-greedy quantifier stops at the
# nearest closing ``**]``.
_PHI_PLACEHOLDER_RE = re.compile(r"\[\*\*.*?\*\*\]", re.DOTALL)

# One or more consecutive newline characters.
_NEWLINE_RUN_RE = re.compile(r"\n+")


def clean_text(text: str) -> str:
    """Normalize a piece of text for downstream processing.

    Steps, in order:

    1. Lower-case the text.
    2. Delete every ``[** ... **]`` span, including spans that contain
       line breaks.
    3. Replace each run of newlines with a single space.
    4. Strip leading and trailing whitespace.

    Whitespace that surrounded a deleted span is left as-is, so removing a
    placeholder from the middle of a sentence leaves two adjacent spaces.

    Args:
        text: The raw input string.

    Returns:
        The cleaned string.
    """
    text = text.lower()
    # Must run before newlines are collapsed only if the pattern could not
    # span lines; with DOTALL the order no longer affects the result.
    text = _PHI_PLACEHOLDER_RE.sub("", text)
    text = _NEWLINE_RUN_RE.sub(" ", text)
    return text.strip()