import requests
import io
import sys
import xlrd
# Marker string searched for in every fetched page (read by findMedia).
# The spelling `meida` is kept because findMedia refers to it by this name.
meida = '<script src="/utils.min.js"></script>'
# Re-wrap stdout's underlying byte buffer so everything printed is encoded as UTF-8.
sys.stdout = io.TextIOWrapper(sys.stdout.buffer,encoding='utf-8')
# Running count of URLs that failed the check; incremented by findMedia.
# NOTE: this name shadows the builtin sum() for the rest of the module.
sum = 0
def findMedia(url, timeout=10):
    """Report *url* if its page does not load or lacks the ``meida`` marker.

    The page is fetched with ``requests``. The URL is printed and the
    module-level ``sum`` counter is incremented when any of these holds:

    * the request fails (connection error, timeout, malformed URL),
    * the response status is not 200,
    * the response body does not contain the module-level ``meida`` string.

    Args:
        url: Address of the page to check.
        timeout: Seconds to wait for the server before giving up, so a
            single unresponsive host cannot stall the whole scan.

    Returns:
        None. Results are reported through stdout and the ``sum`` counter.
    """
    global sum
    try:
        r = requests.get(url, timeout=timeout)
    except requests.RequestException:
        # An unreachable or malformed URL cannot contain the marker; count
        # it as a failure instead of aborting the remaining checks.
        found = False
    else:
        # Clearing the declared encoding makes requests detect it from the
        # body when building r.text.
        r.encoding = None
        # Check the status first so error pages are not decoded needlessly.
        found = r.status_code == 200 and meida in r.text
    if not found:
        print(url)
        sum = sum + 1
#findMedia("http://xxx.com")
# Driver: read the URLs from the first column of one worksheet, check each
# with findMedia, then print how many failed.
# NOTE: xlrd 2.0 and later only read legacy .xls files; opening this .xlsx
# workbook requires xlrd < 2.0.
# Raw string: the backslashes in the Windows path are literal, not escapes.
mediaSheet = xlrd.open_workbook(r"D:\Documents\media.xlsx")
# Worksheet at index 10 (the 11th sheet); fetch only that sheet.
table = mediaSheet.sheet_by_index(10)
nrows = table.nrows
# Every cell of column 0, from the first row to the last.
urls = table.col(0)
print(urls)
for cell in urls:
    value = cell.value
    # Blank or non-text cells are not URLs; requests would raise on them.
    if not isinstance(value, str) or not value.strip():
        continue
    findMedia(value)
# Total number of URLs that failed the check.
print(sum)
# Python：检查 URL 对应的页面中是否包含指定关键字
# 最新推荐文章于 2024-07-12 19:06:42 发布