mindee · felixdittrich92 · Jul 10, 2023 · Jul 4, 2023 · Jul 4, 2023 · Jul 10, 2023
diff --git a/doctr/io/pdf.py b/doctr/io/pdf.py
@@ -3,7 +3,6 @@
 # This program is licensed under the Apache License 2.0.
 # See LICENSE or go to <https://opensource.org/licenses/Apache-2.0> for full license details.
 
-from pathlib import Path
 from typing import Any, List, Optional
 
 import numpy as np
@@ -31,16 +30,12 @@ def read_pdf(
         scale: rendering scale (1 corresponds to 72dpi)
         rgb_mode: if True, the output will be RGB, otherwise BGR
         password: a password to unlock the document, if encrypted
-        kwargs: additional parameters to :meth:`pypdfium2.PdfDocument.render_to`
+        kwargs: additional parameters to :meth:`pypdfium2.PdfPage.render`
 
     Returns:
         the list of pages decoded as numpy ndarray of shape H x W x C
     """
 
-    if isinstance(file, Path):
-        file = str(file)
-
     # Rasterise pages to numpy ndarrays with pypdfium2
-    pdf = pdfium.PdfDocument(file, password=password)
-    renderer = pdf.render_to(pdfium.BitmapConv.numpy_ndarray, scale=scale, rev_byteorder=rgb_mode, **kwargs)
-    return [img for img, _ in renderer]
+    pdf = pdfium.PdfDocument(file, password=password, autoclose=True)
+    return [page.render(scale=scale, rev_byteorder=rgb_mode, **kwargs).to_numpy() for page in pdf]
diff --git a/pyproject.toml b/pyproject.toml
@@ -37,7 +37,7 @@ dependencies = [
     "scipy>=1.4.0,<2.0.0",
     "h5py>=3.1.0,<4.0.0",
     "opencv-python>=4.5.0,<5.0.0",
-    "pypdfium2>=3.3.0,<4.0.0",
+    "pypdfium2>=4.0.0,<5.0.0",
     "pyclipper>=1.2.0,<2.0.0",
     "shapely>=1.6.0,<3.0.0",
     "langdetect>=1.0.9,<2.0.0",