import pdfplumber
# Open the PDF and pull the text out of every page. The context manager
# closes the underlying file when the block exits, even on error.
with pdfplumber.open(r'pdf file.pdf') as file:
    for page in file.pages:
        # Text content of the current page.
        # NOTE: `text` is rebound on each iteration and is not used further
        # in the visible code, so once the loop finishes only the last
        # page's text is still bound. Collect or process it here if every
        # page's text is needed.
        text = page.extract_text()