pip install readability-lxml
>>> import requests
>>> from readability import Document
>>> respose = requests.get('https://segmentfault.com/a/1190000005768094')
>>> doc = Document(respose.text)
>>> doc.title()
'Python利用正则抓取网页内容保存到本地 - python - SegmentFault 思否'
>>>