Spaces:
Sleeping
Sleeping
File size: 2,144 Bytes
80a3675 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 | #!/usr/bin/env python3
"""PDF to Image (JPG/PNG) converter using pdf2image (poppler)."""
import argparse, json, sys, os, zipfile
from pathlib import Path
def convert(input_path, output_path, fmt='jpg', dpi=150):
from pdf2image import convert_from_path
images = convert_from_path(input_path, dpi=dpi, fmt=fmt)
if len(images) == 1:
ext = 'jpg' if fmt.lower() in ('jpg', 'jpeg') else fmt.lower()
if not output_path:
output_path = str(Path(input_path).with_suffix(f'.{ext}'))
save_fmt = 'JPEG' if ext in ('jpg', 'jpeg') else ext.upper()
images[0].save(output_path, save_fmt, quality=95)
return output_path
else:
out_dir = Path(output_path).parent
base = Path(input_path).stem
ext = 'jpg' if fmt.lower() in ('jpg', 'jpeg') else fmt.lower()
zip_path = str(out_dir / f'{base}_images.zip')
with zipfile.ZipFile(zip_path, 'w', zipfile.ZIP_DEFLATED) as zf:
for i, img in enumerate(images):
img_name = f'{base}_page_{i+1}.{ext}'
img_path = str(out_dir / img_name)
save_fmt = 'JPEG' if ext in ('jpg', 'jpeg') else ext.upper()
img.save(img_path, save_fmt, quality=95)
zf.write(img_path, img_name)
os.remove(img_path)
return zip_path
def main():
parser = argparse.ArgumentParser(description='Convert PDF to images')
parser.add_argument('--input', required=True)
parser.add_argument('--output', required=True)
parser.add_argument('--format', default='jpg', choices=['jpg', 'png'])
parser.add_argument('--dpi', type=int, default=150)
args = parser.parse_args()
try:
result = convert(args.input, args.output, args.format, args.dpi)
print(json.dumps({"success": True, "output": result, "message": f"PDF converted to {args.format.upper()} images"}))
except Exception as e:
print(json.dumps({"success": False, "output": "", "message": str(e)}))
sys.exit(1)
if __name__ == '__main__':
main()
|