# Tested on Windows 10 with Python 3.9.
import pdfplumber

# Zero-based index into pdf.pages of the page to extract (index 100 is the
# 101st page of the document).
PAGE_INDEX = 100

# Open the PDF in a context manager so the underlying file is closed as soon
# as the page text has been extracted.
with pdfplumber.open("d:/电子书/终身成长.pdf") as pdf:
    # Report the total number of pages.
    page_count = len(pdf.pages)
    print("总页数:", page_count)
    print("-----------------------------------------")
    # Fail with an explicit message rather than a bare "list index out of
    # range" when the document is shorter than expected.
    if PAGE_INDEX >= page_count:
        raise IndexError(
            f"page index {PAGE_INDEX} is out of range for a PDF with "
            f"{page_count} pages"
        )
    first_page = pdf.pages[PAGE_INDEX]
    # pdfplumber's page_number is already 1-based, so it is printed as-is
    # (adding 1 would report the following page).
    print("本页:", first_page.page_number)
    print("-----------------------------------------")
    # Extract the page text. Normalise a missing result to "" so later code
    # always receives a string (some pdfplumber versions may return None for
    # a page without text -- TODO confirm for the installed version).
    text = first_page.extract_text() or ""
print(text)
# Text-to-speech: read the extracted page text aloud.
# On Linux, install espeak first, otherwise there is no sound:
#   sudo apt-get update && sudo apt-get install espeak
# Original author's note: only English is read aloud (presumably with the
# espeak backend -- verify on the target system).
import pyttsx3

# Initialise the speech engine.
engine = pyttsx3.init()
# Optional tuning the original author left disabled:
#   text = text.replace('\n', '')              # strip line breaks first
#   voices = engine.getProperty('voices')      # choose the voice
#   engine.setProperty('voice', voices[0].id)
#   engine.setProperty('volume', 0.8)          # volume, range 0 to 1
# Speaking rate; the original notes give 0 to 500 as the usual range.
engine.setProperty('rate', 150)
# Only queue speech when there is something to read; an empty page would
# otherwise hand the engine an empty or missing utterance.
if text:
    engine.say(text)
    # Alternative: write the audio to a file instead of speaking it.
    # engine.save_to_file(text, 'test.mp3')
    engine.runAndWait()
else:
    # User-facing notice: "this page has no text to read aloud".
    print("本页没有可朗读的文本")