而我想读取里面的信息,转换成一个类或者另一个对象
def GetUrl(self):
    """Return a signed private-download URL for the hard-coded PDF key.

    Builds a ``qiniu.Auth`` from the instance's access/secret key pair and
    asks it to sign the resource string.

    NOTE(review): the resource string carries no scheme or bucket domain;
    confirm that this is what ``private_download_url`` expects.
    """
    signer = qiniu.Auth(self.__access_key, self.__secret_key)
    return signer.private_download_url("84320875399.pdf")
def DownloadPdf(self, url: str, timeout: float = 30.0) -> bytes:
    """Download the resource at *url* and return its raw bytes.

    Args:
        url: Address to fetch with an HTTP GET.
        timeout: Seconds to wait for the server before giving up. Without
            a timeout ``requests`` may block indefinitely.

    Returns:
        The response body as bytes.

    Raises:
        requests.HTTPError: If the server answers with a 4xx/5xx status.
        requests.RequestException: On connection problems or timeout.
    """
    response = requests.get(url, timeout=timeout)
    # Fail here rather than handing an HTML/JSON error page to the PDF
    # parser, where it would surface as a confusing parse error.
    response.raise_for_status()
    return response.content
def TryParsePdf(self, data):
    """Print every text line of an in-memory PDF and report if any was found.

    Args:
        data: Raw bytes of the PDF document.

    Returns:
        True if at least one non-blank line of text was extracted from any
        page, False otherwise. The original implementation returned
        ``None`` unconditionally, so a caller testing the result could
        never see success.
    """
    pdf_reader = PdfReader(io.BytesIO(data))
    found_text = False
    for page in pdf_reader.pages:
        # NOTE(review): the positional 0 is kept from the original call;
        # how it is interpreted depends on the installed PDF library
        # version - confirm it is the intended argument.
        text = page.extract_text(0) or ""
        for row in text.split('\n'):
            print(row)
            if row.strip():
                found_text = True
    return found_text
def PrasePdf(self):
    """Fetch the signed URL, download the PDF and run the parser on it.

    Prints ``success`` when the parser reports a truthy result.

    Returns:
        True if parsing reported success, False otherwise.
    """
    url = self.GetUrl()
    data = self.DownloadPdf(url)
    # The parser method is named TryParsePdf; the previous call to
    # "TryParseDef" raised AttributeError before anything was parsed.
    succeeded = bool(self.TryParsePdf(data))
    if succeeded:
        print("success")
    return succeeded
如果 PyPDF2 没有实现这个功能,请告诉我可以选择什么库。
帮助我!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!