使用 Python 的 lxml.etree 库和 urllib.request 模块爬取网络美女图片
代码如下:
```python
from lxml import etree
import urllib.request,os,time
class OuMeiSpider(object):
def __init__(self, start_page, end_page):
    """Store the requested page range and the fixed request settings.

    Args:
        start_page: Stored unchanged as ``self.start_page``; presumably
            the first listing page to crawl (confirm against the caller).
        end_page: Stored unchanged as ``self.end_page``; presumably the
            last listing page to crawl (inclusiveness is decided by the
            code that iterates the range, not here).
    """
    self.start_page = start_page
    self.end_page = end_page

    # The first listing page has no numeric suffix; every other page is
    # reached by filling the page number into the `{}` placeholder
    # (get_request picks between the two based on `page == 1`).
    self.first_url = 'http://sc.chinaz.com/tag_tupian/OuMeiMeiNv.html'
    self.url = 'http://sc.chinaz.com/tag_tupian/OuMeiMeiNv_{}.html'

    # Send a browser User-Agent so the site does not identify the client
    # as a crawler and refuse the request.
    self.headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/76.0.3809.100 Safari/537.36',
    }
def get_request(self,page):
# Check whether this is the first page
if page == 1:
url = self.first_url
else:
url = self.url.format(page)
#构建请求对象
request = urllib.request.Request(url=url,headers=