# -*-coding:utf-8-*-
from bs4 import BeautifulSoup
import requests, time
# Base listing URL; get_more_pages appends the page number to build each request URL.
url = 'https://knewone.com/discover?page='
def get_page(url, data=None, timeout=10):
    """Fetch one listing page and print the image, title and link of each item.

    Args:
        url: Full URL of the page to download.
        data: When left as ``None`` the scraped records are printed; any
            other value suppresses the output. The page is still downloaded
            and parsed either way.
        timeout: Seconds to wait for the server before ``requests`` gives up,
            so a stalled connection cannot block the crawl indefinitely.

    Returns:
        None. Each record is printed as a dict with the keys ``img``,
        ``title`` and ``link``.
    """
    wb_data = requests.get(url, timeout=timeout)
    soup = BeautifulSoup(wb_data.text, 'html.parser')
    imgs = soup.select('a.cover-inner > img')
    # Title and link are attributes of the same <a> element, so a single
    # query serves both.
    anchors = soup.select('section.content > h4 > a')

    if data is not None:
        return

    # zip stops at the shorter list, so unmatched trailing elements are dropped.
    for img, anchor in zip(imgs, anchors):
        record = {
            'img': img.get('src'),
            'title': anchor.get('title'),
            'link': anchor.get('href'),
        }
        # The parenthesised single-argument form prints the same text on
        # Python 2 and Python 3.
        print(record)
def get_more_pages(start, end, delay=2):
    """Scrape a consecutive range of listing pages, pausing between requests.

    Args:
        start: First page number to fetch.
        end: Page number to stop before (exclusive, as with ``range``).
        delay: Seconds to sleep between two consecutive page requests.

    Returns:
        None. An empty range (``start >= end``) fetches nothing.
    """
    for index, page in enumerate(range(start, end)):
        # Pause only between requests: there is nothing to wait for before
        # the first page or after the last one.
        if index:
            time.sleep(delay)
        get_page(url + str(page))
# Run the crawl: fetches pages 1 through 9 (the end bound is exclusive).
get_more_pages(1, 10)