def is_text_based_pdf(pages_text, min_chars: int = 500) -> bool:
    """Return whether the extracted page text is long enough to count as text-based.

    The per-page strings are concatenated, leading and trailing whitespace
    of the combined text is stripped, and the remaining length is compared
    against ``min_chars``.

    Args:
        pages_text: Iterable of per-page text strings. Entries that are
            ``None`` (or otherwise falsy) are treated as empty pages
            instead of raising ``TypeError`` in ``str.join``.
        min_chars: Minimum number of characters, inclusive, that the
            combined text must contain.

    Returns:
        ``True`` if the stripped, combined text has at least ``min_chars``
        characters, otherwise ``False``.
    """
    # A page with no extractable text may arrive as None rather than "";
    # substitute "" so one such page does not abort the whole check.
    combined_text = "".join(page or "" for page in pages_text).strip()
    return len(combined_text) >= min_chars