import requests
import bs4
from bs4 import BeautifulSoup
def getHtmlText(url):
try:
r= requests.get(url,timeout=30)
r.raise_for_status
r.encoding=r.apparent_encoding
return r.text
except:
print("加载超时")
def fillUnivList(ulist,html):
soup=BeautifulSoup(html,'html.parser')
for tr in soup.find("tbody").children:
if isinstance(tr,bs4.element.Tag):
tds=tr('td')
ulist.append([tds[0].string,tds[1].string,tds[3].string])
pass
def printUnivlist(ulist,num):
print("{:^10}\t{:^6}\t{:^10}".format("排名","学校","总分"))
for i in range(num):
u=ulist[i]
print("{:^10}\t{:^6}\t{:^10}".format(u[0],u[1],u[2]))
#print(u[0])
def main():
uinfo=[]
url = "http://www.zuihaodaxue.cn/zuihaodaxuepaiming2016.html"
html=getHtmlText(url)
fillUnivList(uinfo,html)
printUnivlist(uinfo,20)
main()
优化后(优化中文字符对齐,chr(12288))
import requests
import bs4
from bs4 import BeautifulSoup
def getHtmlText(url):
try:
r= requests.get(url,timeout=30)
r.raise_for_status
r.encoding=r.apparent_encoding
return r.text
except:
print("加载超时")
def fillUnivList(ulist,html):
soup=BeautifulSoup(html,'html.parser')
for tr in soup.find("tbody").children:
if isinstance(tr,bs4.element.Tag):
tds=tr('td')
ulist.append([tds[0].string,tds[1].string,tds[3].string])
pass
def printUnivlist(ulist,num):
tplt= "{0:^10}\t{1:{3}^10}\t{2:^10}"//详细说明:{0:^10} 0表示第几个元素(这里就代表排名)^表示按中对齐10表示宽度
print(tplt.format("排名","学校","总分",chr(12288)))
for i in range(num):
u=ulist[i]
print(tplt.format(u[0],u[1],u[2],chr(12288)))
#print(u[0])
def main():
uinfo=[]
url = "http://www.zuihaodaxue.cn/zuihaodaxuepaiming2016.html"
html=getHtmlText(url)
fillUnivList(uinfo,html)
printUnivlist(uinfo,20)
main()