diff --git a/deepdoc/parser/pdf_parser.py b/deepdoc/parser/pdf_parser.py index 29947f7d93..909b89d5cc 100644 --- a/deepdoc/parser/pdf_parser.py +++ b/deepdoc/parser/pdf_parser.py @@ -23,7 +23,7 @@ from PIL import Image, ImageDraw import numpy as np from timeit import default_timer as timer -from PyPDF2 import PdfReader as pdf2_read +from pypdf import PdfReader as pdf2_read from api.utils.file_utils import get_project_base_directory from deepdoc.vision import OCR, Recognizer, LayoutRecognizer, TableStructureRecognizer diff --git a/requirements.txt b/requirements.txt index e50d7f86cc..1752b7759a 100644 --- a/requirements.txt +++ b/requirements.txt @@ -79,3 +79,4 @@ word2number==1.1 xgboost==2.1.0 xpinyin==0.7.6 zhipuai==2.0.1 +pypdf==4.3.0 diff --git a/requirements_arm.txt b/requirements_arm.txt index 3650ca538d..1a8f6a137e 100644 --- a/requirements_arm.txt +++ b/requirements_arm.txt @@ -153,3 +153,4 @@ groq==0.9.0 wikipedia==1.4.0 Bio==1.7.1 arxiv==2.1.3 +pypdf==4.3.0 diff --git a/requirements_dev.txt b/requirements_dev.txt index ee08297370..f518cab644 100644 --- a/requirements_dev.txt +++ b/requirements_dev.txt @@ -138,3 +138,4 @@ groq==0.9.0 wikipedia==1.4.0 Bio==1.7.1 arxiv==2.1.3 +pypdf==4.3.0