# 网址检查 (URL checker)
import urllib.request
import time
import os
import datetime
# Shared opener that sends a browser-like User-agent header with every request.
opener = urllib.request.build_opener()
opener.addheaders = [('User-agent', 'Mozilla/49.0.2')]

# File listing the URLs to check, one per line; edit this to point at your own
# list.  Raw strings keep the Windows backslashes literal: without the r prefix
# "\t" would turn into a TAB and "\u" would be a truncated unicode escape.
URL_LIST_PATH = r'E:\脚本\py\test.txt'
# File that successful checks are appended to.
LOG_PATH = r'E:\py\log\url.txt'


def load_urls(path):
    """Return the URLs listed one per line in the text file at *path*.

    Surrounding whitespace is stripped and blank lines are skipped, so a
    trailing empty line does not turn into a request for an empty URL.
    The file is read with the platform default encoding.
    """
    with open(path) as url_file:
        return [url for url in (line.strip() for line in url_file) if url]


def is_reachable(url):
    """Return True if *url* can be opened through the shared ``opener``.

    ``urllib.error.URLError`` and its subclass ``HTTPError`` both derive from
    ``OSError``; ``ValueError`` is raised for strings that are not usable
    URLs (for example a missing scheme).  Any of these counts as unreachable
    instead of aborting the whole run.
    """
    try:
        # Close the response straight away: only success/failure matters.
        with opener.open(url):
            return True
    except (OSError, ValueError):
        return False


def check_urls(urls, log_path=LOG_PATH, error_delay=2, delay=0.1):
    """Check every URL in *urls*, printing the outcome of each one.

    Reachable URLs are also appended to *log_path* together with a timestamp
    and a separator line; failures are only printed.  After a failure the
    loop pauses *error_delay* seconds, and after every URL it pauses *delay*
    seconds.

    Returns a list of ``(url, reachable)`` tuples in input order.
    """
    results = []
    for url in urls:
        reachable = is_reachable(url)
        if reachable:
            # Take the timestamp once so the console and the log agree.
            stamp = datetime.datetime.now().strftime('%Y-%m-%d %H:%M:%S')
            print(url + '没问题')
            print(stamp + '\n')
            # Open per entry so the handle is closed (and the entry flushed)
            # as soon as it has been written.
            with open(log_path, 'a+') as log_file:
                log_file.write(url + '没问题' + '\n')
                log_file.write(stamp + '\n')
                log_file.write("************************" + '\n')
        else:
            print(url + '=访问页面出错')
            time.sleep(error_delay)
        results.append((url, reachable))
        time.sleep(delay)
    return results


def main():
    """Load the URL list, echo it, and check each URL in turn."""
    urls = load_urls(URL_LIST_PATH)
    print(urls)
    print('开始检查:')
    check_urls(urls)


if __name__ == "__main__":
    main()