# coding: utf-8
# __author__ = 'wang'
"""Download the images of every gallery linked from an ivsky.com index page.

The script fetches ``INDEX_URL``, follows each gallery link matched by the
``ul.ali li div a`` selector, and stores the images matched by
``ul.pli li img`` on each gallery page as ``1.jpg``, ``2.jpg``, ... inside
``ROOT_DIR/<gallery title>/``.
"""
import os
import urllib

import requests
from bs4 import BeautifulSoup

try:  # Python 3
    from urllib.parse import urljoin
    from urllib.request import urlretrieve
except ImportError:  # Python 2, which this script was originally written for
    from urlparse import urljoin
    urlretrieve = urllib.urlretrieve

BASE_URL = 'http://www.ivsky.com'
INDEX_URL = 'http://www.ivsky.com/tupian/ziranfengguang/'
ROOT_DIR = u'风景图片子页图片'
# Seconds to wait on the server before giving up instead of hanging forever.
REQUEST_TIMEOUT = 30


def _ensure_dir(path):
    """Create *path* (and missing parents); an existing directory is fine."""
    try:
        os.makedirs(path)
    except OSError:
        # Re-raise unless the failure was simply "directory already exists".
        if not os.path.isdir(path):
            raise


def _safe_dirname(title):
    """Turn a scraped title into a single, harmless directory name."""
    cleaned = title.strip()
    # The title comes from a web page: never let it introduce path components.
    for separator in ('/', '\\'):
        cleaned = cleaned.replace(separator, '_')
    if cleaned in ('', '.', '..'):
        return '_'
    return cleaned


def _fetch_soup(url):
    """Fetch *url* and return its parsed document.

    Raises:
        requests.RequestException: on connection failure, timeout, or an
            HTTP error status (so error pages are not parsed as content).
    """
    response = requests.get(url, timeout=REQUEST_TIMEOUT)
    response.raise_for_status()
    return BeautifulSoup(response.content, 'lxml')


# Kept at import time because the original script created the root directory
# here; unlike the original it no longer fails when the directory exists.
_ensure_dir(ROOT_DIR)


def get_data():
    """Return the gallery anchor tags found on the index page."""
    return _fetch_soup(INDEX_URL).select('ul.ali li div a')


def get_page(result_list):
    """Download every gallery referenced by *result_list*.

    Args:
        result_list: iterable of anchor tags (as returned by ``get_data``)
            whose ``href`` is the gallery link and whose ``title`` names the
            directory created under ``ROOT_DIR``.

    Anchors lacking either attribute are skipped. The working directory is
    never changed, so a failure in one gallery cannot leave the process
    stranded inside a sub-directory.
    """
    for anchor in result_list:
        page = anchor.get('href')
        title = anchor.get('title')
        if not page or not title:
            continue
        target = os.path.join(ROOT_DIR, _safe_dirname(title))
        _ensure_dir(target)
        get_page_html(title, page, target)


def get_page_html(name, lianjie, dest_dir=None):
    """Fetch one gallery page and download the images it lists.

    Args:
        name: gallery title; accepted for backward compatibility, not used.
        lianjie: gallery link, absolute or relative to ``BASE_URL``.
        dest_dir: directory to save into; defaults to the current directory.
    """
    soup = _fetch_soup(urljoin(BASE_URL, lianjie))
    down_load(soup.select('ul.pli li img'), dest_dir)


def down_load(list, dest_dir=None):
    """Save each image in *list* as ``<n>.jpg``, numbering from 1.

    Args:
        list: iterable of ``img`` tags; tags without a ``src`` are skipped.
            (The name shadows the builtin but is kept so existing keyword
            callers keep working.)
        dest_dir: directory to save into; defaults to the current directory.

    Unlike the original implementation this function does not change the
    working directory after saving.
    """
    if dest_dir is None:
        dest_dir = os.curdir
    sources = (img.get('src') for img in list)
    for index, src in enumerate((s for s in sources if s), 1):
        # urljoin resolves protocol-relative ("//host/...") and relative
        # sources, which urlretrieve cannot open on its own.
        urlretrieve(urljoin(BASE_URL, src),
                    os.path.join(dest_dir, '%s.jpg' % index))


if __name__ == '__main__':
    tupian = get_data()
    get_page(tupian)
bs4获取风景图片
最新推荐文章于 2023-01-02 12:13:40 发布