from bs4 import BeautifulSoup
import requests
import time
# Scrape the European Chamber press-release listing and print, for every
# entry, a running number, the first 10 characters of its category label,
# its title and its absolute URL. Finally report how long each phase took.

t0 = time.perf_counter()
url = "https://www.europeanchamber.com.cn/en/press-releases"
headers = {
    'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_11_2) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/47.0.2526.80 Safari/537.36'
}
# A timeout keeps the script from hanging forever on a stalled connection;
# raise_for_status() stops us from parsing an HTTP error page as if it were
# the listing.
response = requests.get(url, headers=headers, timeout=30)
response.raise_for_status()
html = response.content
t1 = time.perf_counter()

# Each ".panel-default" element is expected to wrap one press release.
soup = BeautifulSoup(html, "lxml").select(".panel-default")
i = 0
t2 = time.perf_counter()

for sp in soup:
    # Look each element up once; select_one() returns None instead of
    # raising when the element is absent.
    category = sp.select_one(".chapter-category")
    link = sp.select_one("h3 a")
    href = link.get("href") if link is not None else None
    if category is None or href is None:
        # Not a complete press-release entry: skip it rather than crash.
        continue
    # Count only the entries actually printed so the numbering has no gaps.
    i += 1
    print(i, category.text.strip()[:10], link.text)
    print("https://www.europeanchamber.com.cn" + href)
t3 = time.perf_counter()

# Time spent in each step
print("read:", t1 - t0)
print("soup:", t2 - t1)
print("print:", t3 - t2)