2023-05-17 19:53:44 +00:00
|
|
|
import os
|
|
|
|
|
|
|
|
from wand.color import Color
|
|
|
|
from wand.image import Image
|
|
|
|
|
|
|
|
|
|
|
|
def convert_pdf(filename, filetype, output_path, resolution=300):
|
|
|
|
""" Convert a PDF into images.
|
|
|
|
|
|
|
|
All the pages will give a single png file with format:
|
|
|
|
{pdf_filename}-{page_number}.png
|
|
|
|
|
|
|
|
The function removes the alpha channel from the image and
|
|
|
|
replace it with a white background.
|
|
|
|
"""
|
|
|
|
all_pages = Image(filename=filename, resolution=resolution)
|
|
|
|
for i, page in enumerate(all_pages.sequence):
|
|
|
|
with Image(page) as img:
|
|
|
|
img.format = filetype
|
|
|
|
img.background_color = Color('white')
|
|
|
|
img.alpha_channel = 'remove'
|
|
|
|
|
|
|
|
image_filename = os.path.splitext(os.path.basename(filename))[0]
|
2023-05-17 20:00:09 +00:00
|
|
|
image_filename = f'{image_filename}-{i:03}.{filetype}'
|
2023-05-17 19:53:44 +00:00
|
|
|
image_filename = os.path.join(output_path, image_filename)
|
|
|
|
|
|
|
|
img.save(filename=image_filename)
|