def extract(text, paper=None, logger=logger):
    """Return the title stored in the PDF metadata of *paper*, if any.

    Args:
        text: Not used by this extractor; kept so the signature stays
            compatible with existing callers.
        paper: Object exposing ``_read_document()``; its result is handed
            to ``PdfFileReader``. With ``None`` there is nothing to read.
        logger: Logger used to report why the metadata could not be read.
            ``None`` disables the report.

    Returns:
        The tuple ``(value_text, value_result, source_type, source_detail)``,
        i.e. ``(title, title, "extracted", "pdf metadata")``, when the
        metadata holds a non-empty title; otherwise ``None``.
    """
    if paper is None:
        return None

    try:
        pdf = paper._read_document()
        title = PdfFileReader(pdf).getDocumentInfo().title
    except Exception:
        # Best effort: any failure while reading the document means "no
        # title". Only ``Exception`` is caught so KeyboardInterrupt and
        # SystemExit still propagate. There is currently no fallback that
        # searches the text for a title.
        if logger is not None:
            logger.debug("Could not read title from PDF metadata", exc_info=True)
        return None

    if not title:
        return None
    return (title, title, "extracted", "pdf metadata")
评论列表
文章目录