Python——用爬虫下载妹子图

最新推荐文章于 2020-12-10 22:03:43 发布

ChenTianSaber

最新推荐文章于 2020-12-10 22:03:43 发布

阅读量747

点赞数

分类专栏：我的学习笔记　文章标签：python 爬虫

本文链接：https://blog.csdn.net/ChenTianSaber/article/details/52267143

版权

我的学习笔记专栏收录该内容

13 篇文章 0 订阅

订阅专栏

import os
import re
import urllib.request

def agentIp(url='http://www.kuaidaili.com/'):
    """Return the first IPv4 address found in the text of a web page.

    Args:
        url: Page to scan. Defaults to the kuaidaili.com front page.

    Returns:
        The first dotted-quad IPv4 address in the page, as a string.

    Raises:
        IndexError: If the page contains no IPv4 address.
    """
    # Each octet is limited to 0-255: 250-255, 200-249, 100-199, 0-99.
    octet = r'(?:25[0-5]|2[0-4][0-9]|1[0-9][0-9]|[1-9]?[0-9])'
    # The look-arounds stop the match from starting or ending in the middle
    # of a longer run of digits (e.g. "1234.1.1.1" is not an address).
    pat = re.compile(r'(?<![0-9])' + octet + r'(?:\.' + octet + r'){3}(?![0-9])')
    # The context manager closes the connection even if decoding fails.
    with urllib.request.urlopen(url) as html:
        content = html.read().decode('utf-8')
    found = pat.search(content)
    if found is None:
        raise IndexError('no IPv4 address found at ' + url)
    return found.group(0)

def openTargetUrl(url='http://jandan.net/ooxx/page-2099#comments'):
    """Fetch a page and return the .jpg URLs referenced by its <img> tags.

    Args:
        url: Page to scrape. Defaults to page 2099 of jandan.net/ooxx.

    Returns:
        A list of image URL strings in document order (duplicates kept).
        Each URL starts at the scheme and ends at the first ".jpg" inside
        the src attribute. The list is empty when nothing matches.
    """
    req = urllib.request.Request(url)
    req.add_header('User-agent','Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/50.0.2661.102 Safari/537.36')
    # The context manager closes the connection even if decoding fails.
    with urllib.request.urlopen(req) as res:
        content = res.read().decode('utf-8')
    # [^"]*? keeps the match inside a single src attribute, so several <img>
    # tags on one line yield one URL each instead of one merged string.
    # The capture group returns the URL without the leading '<img src="'.
    pat = re.compile(r'<img src="(https?://[^"]*?\.jpg)')
    return pat.findall(content)

def download(L, dest_dir="D:\\Download\\PythonJPG\\"):
    """Download every URL in L and save each one as a file in dest_dir.

    Args:
        L: Iterable of URL strings to fetch.
        dest_dir: Directory to write into; created if it does not exist.
            Defaults to D:\\Download\\PythonJPG\\.

    Each file is named after the last "/"-separated component of its URL,
    so two URLs with the same final component overwrite each other.
    Network and file errors propagate to the caller.
    """
    # Create the target folder up front so the first write cannot fail
    # just because the directory is missing.
    os.makedirs(dest_dir, exist_ok=True)
    for url in L:
        name = url.split("/")[-1]
        req = urllib.request.Request(url)
        req.add_header('User-agent',
                       'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/50.0.2661.102 Safari/537.36')
        # Close each response as soon as its body has been read.
        with urllib.request.urlopen(req) as res:
            content = res.read()
        with open(os.path.join(dest_dir, name), 'wb') as f:
            f.write(content)


def main():
    """Collect the image URLs from the target page, save them, then report."""
    image_urls = openTargetUrl()
    download(image_urls)
    # agentIp() exists for proxy lookup but is intentionally not called here.
    print("图片下载完成！")


if __name__ == "__main__":
    main()

左边是代码，右边是下载到的图片。代码比较简单，目前只能下载一页，以后有空再完善。

结果图片

ChenTianSaber

关注

0
点赞
踩
0

收藏

觉得还不错? 一键收藏
0
评论
Python——用爬虫下载妹子图

import urllib.request import re def agentIp(): url='http://www.kuaidaili.com/' html=urllib.request.urlopen(url) content=html.read().decode('utf-8') pat=re.compile(r'(((2[0-5][0-5]|1[0-9]…
复制链接

扫一扫