Spaces:

broadfield-dev
/

PDF_2_Image

Running

App Files Files Community

PDF_2_Image / app.py

broadfield-dev

Update app.py

434e44f verified 3 days ago

raw

history blame contribute delete

8.33 kB

	import os
	import tempfile
	import logging
	from typing import List
	import math

	import gradio as gr
	import requests
	from PIL import Image
	from pdf2image import convert_from_path, convert_from_bytes
	from pdf2image.exceptions import PDFInfoNotInstalledError, PDFPageCountError

	logging.basicConfig(level=logging.INFO, format="%(asctime)s - %(levelname)s - %(message)s")
	logger = logging.getLogger(__name__)

	def stitch_images_vertically(images: List[Image.Image]) -> Image.Image:
	    """Stack images top-to-bottom on a single white RGB canvas.

	    The canvas is as wide as the widest image and as tall as the sum of
	    all image heights. Every image is pasted at x=0, so narrower images
	    leave white space on their right.

	    Args:
	        images: PIL images to stack, in top-to-bottom order.

	    Returns:
	        The combined image, or ``None`` when ``images`` is empty or
	        contains an object that is not a ``PIL.Image.Image``.
	    """
	    if not images:
	        return None

	    # Refuse to stitch if anything in the list is not a PIL image.
	    if any(not isinstance(candidate, Image.Image) for candidate in images):
	        logger.error("Non-Image object found in list for vertical stitching.")
	        return None

	    canvas_width = max(page.width for page in images)
	    canvas_height = sum(page.height for page in images)
	    canvas = Image.new('RGB', (canvas_width, canvas_height), (255, 255, 255))

	    # Walk down the canvas, placing each page directly below the previous one.
	    offset_y = 0
	    for page in images:
	        canvas.paste(page, (0, offset_y))
	        offset_y += page.height

	    return canvas

	def stitch_images_in_grid(images: List[Image.Image], num_columns: int, page_order: str) -> Image.Image:
	    """Arrange images into columns and join the columns side by side.

	    Each column is built with ``stitch_images_vertically`` and the
	    resulting column images are pasted left-to-right, top-aligned, on a
	    white RGB canvas.

	    Args:
	        images: PIL images in reading order.
	        num_columns: Number of columns to distribute the images over.
	            Coerced to an int of at least 1.
	        page_order: ``"Top-to-Bottom (down)"`` fills the first column
	            completely before moving to the next one. Any other value
	            deals images across the columns round-robin
	            (left-to-right).

	    Returns:
	        The grid image, or ``None`` when ``images`` is empty or no
	        column could be stitched.
	    """
	    if not images:
	        return None

	    # range() and slice steps need a positive int; guard against a float
	    # or a non-positive column count.
	    num_columns = max(1, int(num_columns))

	    if page_order == "Top-to-Bottom (down)":
	        # Consecutive runs of num_rows images form each column.
	        num_rows = math.ceil(len(images) / num_columns)
	        columns = [
	            images[i * num_rows:(i + 1) * num_rows]
	            for i in range(num_columns)
	        ]
	    else:  # Default to "Left-to-Right (across)"
	        # Every num_columns-th image, starting at i, lands in column i.
	        columns = [images[i::num_columns] for i in range(num_columns)]

	    # Skip empty columns (fewer images than columns) and columns whose
	    # stitching failed (stitch_images_vertically returned None).
	    stitched_columns = [
	        stitched
	        for stitched in (stitch_images_vertically(col) for col in columns if col)
	        if stitched is not None
	    ]

	    if not stitched_columns:
	        return None

	    max_height = max(col.height for col in stitched_columns)
	    total_width = sum(col.width for col in stitched_columns)
	    grid_image = Image.new('RGB', (total_width, max_height), (255, 255, 255))

	    current_x = 0
	    for col_img in stitched_columns:
	        grid_image.paste(col_img, (current_x, 0))
	        current_x += col_img.width

	    return grid_image

	def process_pdf(pdf_file, pdf_url, dpi, num_columns, crop_top, crop_bottom, crop_left, crop_right, hide_annotations, page_order, progress=gr.Progress()):
	    """Render every page of a PDF and stitch the pages into one PNG.

	    The PDF comes from ``pdf_file`` when it is provided, otherwise it is
	    downloaded from ``pdf_url``. Pages are rendered with pdf2image,
	    optionally cropped, stitched vertically or in a grid, and written to
	    a temporary ``.png`` file that is not deleted automatically.

	    Args:
	        pdf_file: Uploaded file, either an object exposing ``.name`` or a
	            plain path string, or ``None``.
	        pdf_url: URL of a PDF; used only when ``pdf_file`` is ``None``.
	        dpi: Rendering resolution passed to pdf2image.
	        num_columns: Values above 1 select the grid layout.
	        crop_top, crop_bottom, crop_left, crop_right: Pixels removed from
	            the corresponding edge of every rendered page.
	        hide_annotations: Passed through to pdf2image.
	        page_order: Column fill order, forwarded to
	            ``stitch_images_in_grid``.
	        progress: Gradio progress callback.

	    Returns:
	        A tuple holding the output path twice.

	    Raises:
	        gr.Error: On missing input, download failure, conversion failure,
	            an empty PDF, crop values that leave no area, or stitching
	            failure.
	    """
	    pdf_input_source = None
	    is_bytes = False
	    source_name = "document"

	    progress(0, desc="Validating input...")
	    if pdf_file is not None:
	        # Accept both a file wrapper exposing ``.name`` and a bare path
	        # string, so the callback works whichever form it is handed.
	        pdf_path = getattr(pdf_file, "name", pdf_file)
	        logger.info(f"Processing uploaded file: {pdf_path}")
	        pdf_input_source = pdf_path
	        source_name = os.path.splitext(os.path.basename(pdf_path))[0] or source_name
	    elif pdf_url and pdf_url.strip():
	        url = pdf_url.strip()
	        logger.info(f"Processing file from URL: {url}")
	        progress(0.1, desc="Downloading PDF from URL...")
	        try:
	            # NOTE(review): the URL is user-supplied and fetched server-side
	            # with no host or size restriction - confirm this is acceptable
	            # for the deployment.
	            response = requests.get(url, timeout=45)
	            response.raise_for_status()
	        except requests.RequestException as e:
	            raise gr.Error(f"Failed to download PDF from URL. Error: {e}") from e
	        pdf_input_source = response.content
	        # Drop any query string before deriving a name; keep the default
	        # when the URL path has no usable file name.
	        source_name = os.path.splitext(os.path.basename(url.split('?')[0]))[0] or source_name
	        is_bytes = True
	    else:
	        raise gr.Error("Please upload a PDF file or provide a valid URL.")

	    progress(0.3, desc="Converting PDF pages to images...")
	    logger.info(f"Using DPI: {dpi}, Hide Annotations: {hide_annotations}")
	    try:
	        if is_bytes:
	            images = convert_from_bytes(pdf_input_source, dpi=dpi, hide_annotations=hide_annotations)
	        else:
	            images = convert_from_path(pdf_input_source, dpi=dpi, hide_annotations=hide_annotations)
	    except (PDFInfoNotInstalledError, FileNotFoundError) as e:
	        raise gr.Error("Server configuration error: Poppler dependency is missing.") from e
	    except Exception as e:
	        # Deliberately broad: this is the UI boundary, so any conversion
	        # failure is logged and surfaced as a user-facing error.
	        logger.exception("PDF conversion failed.")
	        raise gr.Error(f"Failed to process the PDF. It might be corrupted or password-protected. Error: {e}") from e

	    if not images:
	        raise gr.Error("Could not extract any pages from the PDF. The file might be empty or invalid.")

	    logger.info(f"Successfully converted {len(images)} pages to images.")

	    if crop_top > 0 or crop_bottom > 0 or crop_left > 0 or crop_right > 0:
	        progress(0.6, desc="Cropping images...")
	        cropped_images = []
	        for i, img in enumerate(images):
	            width, height = img.size
	            left, top, right, bottom = crop_left, crop_top, width - crop_right, height - crop_bottom
	            # A box with no positive area means the crop consumed the page.
	            if left >= right or top >= bottom:
	                raise gr.Error(f"Crop values are too large for page {i+1}. The page dimensions are {width}x{height}, but crop settings result in an invalid area.")
	            cropped_images.append(img.crop((left, top, right, bottom)))
	    else:
	        cropped_images = images

	    progress(0.7, desc=f"Stitching {len(cropped_images)} images together...")

	    # Normalise to int so a float column count cannot reach range()/slicing.
	    num_columns = int(num_columns)
	    if num_columns > 1:
	        stitched_image = stitch_images_in_grid(cropped_images, num_columns, page_order)
	    else:
	        stitched_image = stitch_images_vertically(cropped_images)

	    if stitched_image is None:
	        raise gr.Error("Image stitching failed.")
	    logger.info("Image stitching complete.")

	    progress(0.9, desc="Saving final image...")
	    # delete=False: the file must outlive this function so the returned
	    # path stays readable.
	    with tempfile.NamedTemporaryFile(delete=False, suffix=".png", prefix=f"{source_name}_stitched_") as tmp_file:
	        stitched_image.save(tmp_file.name, "PNG")
	        output_path = tmp_file.name

	    logger.info(f"Final image saved to temporary path: {output_path}")
	    progress(1, desc="Done!")

	    return output_path, output_path

	# ---------------------------------------------------------------------
	# Gradio UI: inputs and options in the left column, results on the right.
	# ---------------------------------------------------------------------
	with gr.Blocks(theme=gr.themes.Soft()) as demo:
	    gr.Markdown(
	        """
	        # PDF Page Stitcher 📄 ➡️ 🖼️
	        Upload a PDF file or provide a URL. This tool will convert every page of the PDF into an image
	        and then append them to create a single image that you can download.
	        """
	    )
	    with gr.Row():
	        # Left column: PDF source, rendering options and the submit button.
	        with gr.Column(scale=1):
	            with gr.Tabs():
	                with gr.TabItem("Upload PDF"):
	                    pdf_file_input = gr.File(
	                        label="Upload PDF File",
	                        file_types=[".pdf"],
	                    )
	                with gr.TabItem("From URL"):
	                    pdf_url_input = gr.Textbox(
	                        label="PDF URL",
	                        placeholder="e.g., https://arxiv.org/pdf/1706.03762.pdf",
	                    )

	            dpi_slider = gr.Slider(
	                minimum=100,
	                maximum=600,
	                step=5,
	                value=200,
	                label="Image Resolution (DPI)",
	            )
	            columns_slider = gr.Slider(
	                minimum=1,
	                maximum=10,
	                step=1,
	                value=1,
	                label="Number of Columns",
	            )

	            with gr.Accordion("Advanced Options", open=False):
	                hide_annotations_toggle = gr.Checkbox(
	                    value=True,
	                    label="Hide PDF Annotations (Links/Highlights)",
	                    info="Turn this on to remove the colored boxes that can appear around links and references.",
	                )
	                # These labels are the exact values process_pdf receives
	                # as page_order.
	                page_order_choices = ["Left-to-Right (across)", "Top-to-Bottom (down)"]
	                page_order_radio = gr.Radio(
	                    page_order_choices,
	                    value="Left-to-Right (across)",
	                    label="Multi-Column Page Order",
	                    info="Determines how pages fill the columns.",
	                )
	                with gr.Row():
	                    crop_left = gr.Slider(minimum=0, maximum=500, step=10, value=0, label="Crop Left")
	                    crop_right = gr.Slider(minimum=0, maximum=500, step=10, value=0, label="Crop Right")
	                with gr.Row():
	                    crop_top = gr.Slider(minimum=0, maximum=500, step=10, value=0, label="Crop Top")
	                    crop_bottom = gr.Slider(minimum=0, maximum=500, step=10, value=0, label="Crop Bottom")

	            submit_btn = gr.Button("Stitch PDF Pages", variant="primary")

	        # Right column: preview of the stitched image plus a download link.
	        with gr.Column(scale=2):
	            gr.Markdown("## Output")
	            output_image_preview = gr.Image(
	                label="Stitched Image Preview",
	                type="filepath",
	                interactive=False,
	                height=600,
	            )
	            output_image_download = gr.File(
	                label="Download Stitched Image",
	                interactive=False,
	            )

	    # Order must match process_pdf's positional parameters.
	    stitch_inputs = [
	        pdf_file_input,
	        pdf_url_input,
	        dpi_slider,
	        columns_slider,
	        crop_top,
	        crop_bottom,
	        crop_left,
	        crop_right,
	        hide_annotations_toggle,
	        page_order_radio,
	    ]
	    # process_pdf returns the output path twice: once per component below.
	    stitch_outputs = [output_image_preview, output_image_download]

	    submit_btn.click(fn=process_pdf, inputs=stitch_inputs, outputs=stitch_outputs)

	# Listen on all interfaces, port 7860.
	demo.launch(server_name="0.0.0.0", server_port=7860, debug=True)