fabriquedoc-backend/convert_pdf.py

28 lines
931 B
Python
Raw Normal View History

2023-05-17 19:53:44 +00:00
import os
from wand.color import Color
from wand.image import Image
def convert_pdf(filename, filetype, output_path, resolution=300):
""" Convert a PDF into images.
All the pages will give a single png file with format:
{pdf_filename}-{page_number}.png
The function removes the alpha channel from the image and
replace it with a white background.
"""
all_pages = Image(filename=filename, resolution=resolution)
for i, page in enumerate(all_pages.sequence):
with Image(page) as img:
img.format = filetype
img.background_color = Color('white')
img.alpha_channel = 'remove'
image_filename = os.path.splitext(os.path.basename(filename))[0]
2023-05-17 20:00:09 +00:00
image_filename = f'{image_filename}-{i:03}.{filetype}'
2023-05-17 19:53:44 +00:00
image_filename = os.path.join(output_path, image_filename)
img.save(filename=image_filename)