import requests
from bs4 import BeautifulSoup
def getHTMLText(url):
    """Download *url* and return the response body as text.

    The request is made with a 30-second timeout.

    Args:
        url: Address of the page to fetch.

    Returns:
        The decoded page text, or an empty string when the request fails or
        the server answers with an HTTP error status.
    """
    try:
        r = requests.get(url, timeout=30)
        r.raise_for_status()
    except requests.RequestException:
        # Best effort: an empty string signals "nothing downloaded". Only
        # request-level failures are swallowed, so programming errors and
        # KeyboardInterrupt still propagate.
        return ""
    # Decode with the encoding detected from the content instead of the one
    # taken from the response headers.
    r.encoding = r.apparent_encoding
    return r.text
def SoupDemo(html):
    """Extract the text of every ``#content`` element in *html*.

    Args:
        html: HTML markup of a page.

    Returns:
        The stripped text of each element matching the CSS selector
        ``#content``, concatenated in the order ``select`` returns them;
        an empty string when nothing matches.
    """
    # The markup must be parsed before it can be queried. "html.parser" is
    # the parser bundled with Python, so no extra package is required.
    soup = BeautifulSoup(html, "html.parser")
    # Run the selector once and join the pieces in a single pass.
    return "".join(node.get_text().strip() for node in soup.select("#content"))
def WriteText(name, Text):
    """Write *Text* to the file *name*, replacing any existing content.

    Args:
        name: Path of the file to create or overwrite.
        Text: String to write.
    """
    # UTF-8 is set explicitly so non-ASCII text does not depend on the
    # platform's default encoding; ``with`` closes the file even if the
    # write raises.
    with open(name, "w", encoding="utf-8") as f:
        f.write(Text)
def main():
    """Download exercise pages 1 through 100 and save each result to a file.

    For every page number ``i`` the page is fetched with ``getHTMLText``,
    passed through ``SoupDemo``, and the resulting text is written with
    ``WriteText`` to a file named ``work<i>`` (relative to the current
    working directory).
    """
    for i in range(1, 101):
        url = "https://www.runoob.com/python/python-exercise-example{}.html".format(i)
        Text = getHTMLText(url)
        Work = SoupDemo(Text)
        # Format the file name itself; WriteText returns None, so calling
        # .format() on its result would raise AttributeError.
        WriteText('work{}'.format(i), Work)
# Run the scraper only when this file is executed as a script, so importing
# the module does not trigger the downloads.
if __name__ == "__main__":
    main()
# 爬取菜鸟教程 Python 题 100 例
# 最新推荐文章于 2022-11-15 08:15:00 发布