最近在学习 Python 爬虫,写了一个小例子,主要用来爬取 Bing 壁纸。
源码如下:
```python
import requests
from bs4 import BeautifulSoup
import re
import os
from urllib.request import urlretrieve
import time
from email.header import Header
from email.mime.text import MIMEText
from email.utils import parseaddr, formataddr
import smtplib
class BingImgSave:
def __init__(self):
self.user_agent = 'Mozilla/4.0 (compatible; MSIE 5.5; Windows NT)'
self.headers={'User-Agent':self.user_agent}
self.baseurl='https://bing.ioliu.cn/'
self.nextpage = 0
def getHtml(self, urls, timeout=30):
    """Fetch ``urls`` with an HTTP GET using this instance's headers.

    Args:
        urls: Passed unchanged to ``requests.get`` as the URL to request.
        timeout: Seconds to wait for the server before giving up.
            Defaults to 30.

    Returns:
        The response object returned by ``requests.get``.

    Raises:
        requests.exceptions.Timeout: If the server does not respond
            within ``timeout`` seconds.
    """
    # requests applies no timeout by default, so a stalled connection
    # would block the scraper forever; always pass an explicit limit.
    r = requests.get(urls, headers=self.headers, timeout=timeout)
    # Debug output kept from the original: prints the response's type.
    print(type(r))
    return r
def parseHtml(self, response):
soup = BeautifulSoup(response.text, 'lxml', from_encoding='utf-8')
items = soup.find_all('div&#