# Use PyPDF2 to read the contents of a PDF file and save them to a local TXT file.
from PyPDF2.pdf import PdfFileReader
import pandas as pd
def Pdf_to_txt(pdf):
for i in range(0, pdf.getNumPages()):
title = []
lin1, lin2, lin3, lin4, lin5, lin6, lin7, lin8 = [], [], [], [], [], [], [], []
extractedText = pdf.getPage(i).extractText()
text = extractedText.split('\n')
num = 0
for lin in text: