1.安装

pip install pdfplumber

 

2.代码

import pdfplumber as pb

# Extract the text of every page of "1.pdf" and write it to "out.txt".
#
# Both the output file and the PDF are opened in a single `with` statement so
# that they are flushed and closed even if extraction fails part-way through.
# An absolute path can be used for the PDF as well, e.g.
#    path = 'D:\\GKProject\\需求文档.pdf'
with open('out.txt', mode='w', encoding='utf-8') as file_handle, \
        pb.open("1.pdf") as pdf:
    # Total number of pages in the document
    a = len(pdf.pages)
    print("当前页:", a)
    print("-----------------------------------------")

    # Iterate over the pages directly instead of indexing by position
    for first_page in pdf.pages:
        print("本页:", first_page.page_number)
        print("-----------------------------------------")
        # Export the text of the current page
        text = first_page.extract_text()
        # NOTE(review): depending on the pdfplumber version, a page without a
        # text layer may yield None here; fall back to an empty string so
        # write() does not raise TypeError.
        file_handle.write(text or "")

 

posted on 2023-03-02 21:41  大话人生  阅读(85)  评论(0)    收藏  举报