def getPDFContent(path):
    """Return the text of every page of a PDF as one normalised string.

    Args:
        path: Location of the PDF; passed unchanged to
            ``PyPDF2.PdfFileReader``.

    Returns:
        The text extracted from all pages, in page order, with every run
        of whitespace (page breaks and line breaks included) collapsed to
        a single space and no leading or trailing whitespace. An empty
        string when no text is extracted.
    """
    # PdfFileReader's second positional parameter is ``strict``, not a file
    # mode, so a truthy "rb" in that slot only switched strict parsing on.
    # Request that explicitly by keyword instead of via a misleading mode
    # string (NOTE(review): confirm strict parsing is actually wanted).
    pdf = PyPDF2.PdfFileReader(path, strict=True)

    # Collect the per-page text and join once instead of growing a string
    # with += on every iteration.
    page_texts = [
        pdf.getPage(index).extractText()
        for index in range(pdf.getNumPages())
    ]

    # split() without a separator ignores leading/trailing whitespace and
    # treats any whitespace run as one delimiter, so no strip() is needed.
    return " ".join("\n".join(page_texts).split())
评论列表
文章目录