这里用到的数据库,是用 Scrapy 框架深度爬取(翻页)代理 IP 并存入 MySQL 后得到的,规模达到上万条的 IP 池。
当然,如果你已有现成的 IP 池也可以直接使用,只需相应修改下面代码中的数据库连接信息和查询语句。
import pymysql
import requests
def _proxy_works(proxies, url='http://www.baidu.com', timeout=2):
    """Return True if *url* answers with HTTP 200 when fetched via *proxies*."""
    try:
        response = requests.get(url, proxies=proxies, timeout=timeout)
    except requests.RequestException:
        # A dead proxy normally shows up as a timeout or connection error,
        # not as a non-200 status, so treat any request failure as
        # "not usable" instead of letting it abort the whole run.
        return False
    return response.status_code == 200


def start():
    """Check the HTTPS proxies stored in MySQL and prune the dead ones.

    Selects every row of the ``xicidaili`` table whose ``Types`` column is
    ``'HTTPS'`` (column 0 is used as the id, column 1 as the ip, column 2 as
    the port), sends a test request to ``http://www.baidu.com`` through each
    proxy and then:

    * prints each working proxy, collects it, and finally writes the
      collected proxies to ``proxies.txt`` (one ``str(dict)`` per line,
      followed by a comma);
    * deletes the row of each proxy that failed and prints the deleted ids.

    Database errors raised while querying/deleting are printed, not re-raised.

    Returns:
        None. Results are reported on stdout and in ``proxies.txt``.
    """
    print('=======================开始啦======================')
    # Open the MySQL connection. Keyword arguments are used because PyMySQL
    # 1.0+ no longer accepts positional connection arguments.
    ql = pymysql.connect(host='localhost', user='root', password='asdfg',
                         database='python001', charset='utf8')
    cursor = ql.cursor()
    mys = """select * from xicidaili where Types='HTTPS' """
    delete = """delete from xicidaili where id = %s"""
    addres = []
    dele = []
    try:
        cursor.execute(mys)
        results = cursor.fetchall()
        for res in results:
            row_id, ip, port = res[0], res[1], res[2]
            # format() also copes with a numeric port column.
            ips = '{}:{}'.format(ip, port)
            # requests picks the proxy by the scheme of the target URL, so
            # the mapping must be keyed 'http'/'https'; any other key is
            # ignored and the request would go out directly.
            # NOTE(review): the proxy is addressed over plain HTTP, as in
            # the requests documentation examples; change the scheme if the
            # pool really contains TLS-terminating proxies.
            iptest = {'http': 'http://' + ips, 'https': 'http://' + ips}
            if _proxy_works(iptest):
                addres.append(iptest)
                print(str(iptest) + '\t============可用ip============')
            else:
                cursor.execute(delete, (row_id,))
                # PyMySQL does not autocommit by default; commit right away
                # so every id reported in `dele` is really gone from the
                # table even if a later row triggers a database error.
                ql.commit()
                dele.append(row_id)
    except Exception as e:
        print('出错啦:' + str(e))
    finally:
        cursor.close()
        ql.close()
    print('++++++++++++可用ip++++++++++++++')
    print(addres)
    with open('proxies.txt', 'w') as op:
        for proxy in addres:
            op.write(str(proxy) + ',\n')
    print("############删除ip的id号############")
    print(dele)
    print('======================结束啦===========================')
# Run the proxy check as soon as this file is executed (there is no
# __main__ guard, so this also happens when the file is imported).
start()
运行结果: