Spaces:
Sleeping
Sleeping
| import subprocess | |
| import os | |
| import shutil | |
def rename_and_move_files(root_folder):
    """Flatten every ``.md`` file under *root_folder* into *root_folder* itself.

    Each ``<name>.md`` found anywhere in the tree is moved directly into
    *root_folder* and renamed to ``<name>_PDF_FILE.txt``. Every subfolder
    that held at least one ``.md`` file is then deleted together with
    whatever else it contains. Folders without ``.md`` files are left alone.

    Args:
        root_folder: Directory to scan; also the destination of the moved
            files. It is never deleted, even if it directly contains
            ``.md`` files.

    Raises:
        OSError: If a move or a folder removal fails.
    """
    md_suffix = '.md'
    root = os.fspath(root_folder)

    # Snapshot the tree before mutating it, deepest folders first: files
    # moved into the root are not picked up a second time, and nested
    # folders are emptied before their parent is removed.
    snapshot = list(os.walk(root, topdown=False))

    for foldername, _subfolders, filenames in snapshot:
        md_files = [name for name in filenames if name.endswith(md_suffix)]
        if not md_files:
            continue

        for filename in md_files:
            source_path = os.path.join(foldername, filename)
            # Strip only the trailing extension; str.replace would also
            # rewrite a '.md' occurring in the middle of the name.
            new_name = filename[:-len(md_suffix)] + '_PDF_FILE.txt'
            os.rename(source_path, os.path.join(root, new_name))

        # Remove the folder only after ALL of its .md files were moved,
        # and never remove the destination folder itself.
        if foldername != root:
            shutil.rmtree(foldername)
def process_pdf_performance(path):
    """Run ``marker_single`` on every PDF under *path* and flatten the output.

    Creates ``<path>/extracted_pdf/``, walks *path* recursively, and invokes
    the external ``marker_single`` command once per file whose name ends in
    ``.pdf``, with the extraction folder as its output directory. Afterwards
    ``rename_and_move_files`` is called on the extraction folder.

    A failed conversion is reported on stdout and does not stop the
    remaining files from being processed.

    Args:
        path: Root directory to search for PDF files.
    """
    path_extracted_pdf = path+"/extracted_pdf/"
    os.makedirs(path_extracted_pdf, exist_ok=True)

    for root, _dirs, files in os.walk(path):
        for file in files:
            if not file.endswith('.pdf'):
                continue

            pdf_path = os.path.join(root, file)
            print("FILE IS ", pdf_path)

            # Pass the arguments as a list (no shell): spaces, quotes or
            # other shell metacharacters anywhere in the path are handed to
            # the program verbatim instead of being interpreted by a shell.
            command = [
                "marker_single",
                pdf_path,
                path_extracted_pdf,
                "--batch_multiplier",
                "10",
            ]
            try:
                completed = subprocess.run(command, check=False)
            except OSError as err:
                # E.g. the executable is missing; keep going, as a failed
                # shell command would not have aborted the loop either.
                print("FAILED TO RUN marker_single FOR ", pdf_path, ":", err)
                continue

            if completed.returncode != 0:
                print("marker_single EXITED WITH", completed.returncode, "FOR ", pdf_path)

    rename_and_move_files(path_extracted_pdf)