找到网页源码,抓包获取 url,分析并编写正则
#导入模块
import re
import urllib.request
import random
#设置代理池,随机选取一个代理
def open_url(url):
req = urllib.request.Request(url)
req.add_header(“User-Agent”,“Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/66.0.3359.139 Safari/537.36”)
proxy_list = [
{"http":'222.188.178.42:9999'},
{"http":'163.204.243.186:9999'},
{"http":'36.99.215.29:9999'},
{"http":'120.24.173.214:80'},
{"http":'112.85.165.40:9999'},
{"http":'171.80.2.137:9999'},
{"http":'113.128.30.247:808'},
]
proxy = random.choice(proxy_list)
proxy_suopport = urllib.request.ProxyHandler(proxy)
opener = urllib.request.build_opener(proxy_suoppor