#encoding:utf-8
import re
import urllib.parse
import urllib.request
# Locates the "卡号归属地" label, lazily skips ahead to a '>' and then captures
# two space-separated fields that end at the next closing </td> tag:
# group 1 is 2-3 characters, group 2 is everything after the space.
# Matching is case-insensitive, so </TD> is accepted as well.
pattern = re.compile(
    r'卡号归属地[\s\S]*?>(.{2,3})(?= ) (.*?)</td>',
    re.IGNORECASE,
)
def getInfo(number, timeout=10):
    """Look up the home location of a mobile number on ip138.com.

    Args:
        number: The mobile number as a string. It is percent-encoded before
            being placed in the query string, so stray characters cannot
            corrupt the URL.
        timeout: Seconds to wait on the HTTP request before giving up.

    Returns:
        The province and city captured by the module-level ``pattern``,
        joined by a tab, or the literal string '无匹配值' when the response
        body does not match.

    Raises:
        Any exception raised by ``urllib.request.urlopen`` (for example
        ``urllib.error.URLError``) propagates to the caller.
    """
    url = (
        "http://www.ip138.com:8080/search.asp?mobile="
        + urllib.parse.quote(number, safe="")
        + "&action=mobile"
    )
    # The context manager closes the HTTP response even if reading fails.
    with urllib.request.urlopen(url, timeout=timeout) as response:
        # errors="replace" keeps a single undecodable byte from aborting the
        # lookup; valid GB2312 input decodes exactly as before.
        data = response.read().decode('gb2312', errors='replace')

    m = pattern.search(data)
    if m is None:
        return '无匹配值'
    province, city = m.group(1), m.group(2)
    return province + '\t' + city
# Batch driver: read one number per line from telephone.txt and write
# "<number>\t<lookup result>" lines to tel_info.txt.
# The `with` statement closes both files even when a lookup raises part-way
# through, so the lines already written are flushed rather than lost.
with open('tel_info.txt', 'w') as file_info, open('telephone.txt') as numbers:
    for line in numbers:
        line = line.strip()
        file_info.write(line + '\t' + getInfo(line) + '\n')
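# 匹配换行符 [\s\S] -- regex note: `[\s\S]` matches any character, including newlines.
# 后置匹配 xx(?=xxx) -- regex note: lookahead; `xx(?=xxx)` matches `xx` only when it is followed by `xxx`.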