Source code for formhtr.pdf_utils

from __future__ import annotations

import numpy as np

from .libs.pdf_to_image import convert_pdf_to_image



[docs]
def get_pdf_dimensions(*, pdf_file: str, dpi: int = 300) -> dict[str, int]:
    """Pixel size of the first PDF page after rasterization.

    Args:
        pdf_file: Path to the PDF.
        dpi: Rasterization resolution.

    Returns:
        Dict with keys ``height`` and ``width`` in pixels.
    """
    image = np.array(convert_pdf_to_image(pdf_file, dpi=dpi))
    return {
        "height": int(image.shape[0]),
        "width": int(image.shape[1]),
    }