fofa爬虫（python）

绝情且小帅

于 2024-08-20 09:43:03 发布

阅读量193

点赞数 2

文章标签：爬虫 python 开发语言

本文链接：https://blog.csdn.net/qq_74925081/article/details/141347316

版权

import requests
import base64
from lxml import etree
import time


from urllib.parse import quote

# FOFA search expression to scrape; fill this in before running.
search_data = ''
headers = {
    # Add your own FOFA session cookie here if the site requires a login:
    # 'cookie': '<your cookie>'
}

# The query is the same for every page, so encode it once up front.
# Standard base64 output may contain '+', '/' and '=', which carry special
# meaning inside a query string, so percent-encode it before building the URL.
search_data_bs = quote(
    base64.b64encode(search_data.encode('utf-8')).decode('ascii'),
    safe='',
)

# Walk result pages 1 through 5, appending every extracted link to the
# output file.  A failure on one page is reported and the loop moves on,
# so a single bad page does not abort the whole run.
for page in range(1, 6):
    urls = (
        'https://fofa.info/result?page=' + str(page)
        + '&qbase64=' + search_data_bs
    )
    print(urls)
    print('正在提取第' + str(page) + '页')
    try:
        # A timeout keeps a stalled connection from hanging the script.
        response = requests.get(urls, headers=headers, timeout=10)
        # Treat HTTP error statuses as failures instead of parsing the
        # error page as if it were a result listing.
        response.raise_for_status()

        soup = etree.HTML(response.content)
        # etree.HTML may yield None when the body has no parsable markup.
        ip_data = (
            soup.xpath('//a[@target="_blank"]/@href')
            if soup is not None else []
        )
        print(ip_data)

        # Skip the write when nothing was found so the output file does not
        # accumulate blank lines.
        if ip_data:
            with open(r'thinkphp5.txt', 'a', encoding='utf-8') as f:
                f.write('\n'.join(ip_data) + '\n')
    except (requests.RequestException, etree.LxmlError, OSError) as e:
        # Best-effort scraping: report the problem rather than silently
        # swallowing it, then continue with the next page.
        print('page ' + str(page) + ' failed: ' + repr(e))
    # Short pause between requests to avoid hammering the server.
    time.sleep(0.5)