# Scrape a novel with BeautifulSoup and merge the chapters into a single txt file.
"""
======================
@Author:CacheYu
@Time:2019/9/16:16:09
======================
"""
# -*- coding:utf-8 -*-
import urllib.request
import urllib.error
import bs4
from bs4 import BeautifulSoup
def readdown(url):
soup = BeautifulSoup(urllib.request.urlopen(url), 'html.parser')
fixed_html = soup.prettify()
table = soup.find('table', attrs={'id': 'tabletxt'})
# # if isinstance(table, bs4.element.Tag):
# tds = table.find_all('td')
i = table.find('i').string
print(i)
div = table.find_all('div', attrs={'class': 'txt'})
content = div[0].get_text().strip()
couple = i