import re

import requests

# First experiment: fetch the index page of the brain-teaser section, dump the
# raw HTML, then pull out each riddle entry and show how it splits into parts.
url = 'https://www.2345.com/inner/jzw/'
# A timeout keeps the script from hanging forever on a stalled connection.
wang_zhi = requests.get(url, timeout=30)
print(wang_zhi.text)

# Capture everything between the opening of the question span and the
# "点击显示答案" link text of the same <li>.
tt = re.findall(""" <li><span class="table_left">(.*)点击显示答案</a></span></li>""", wang_zhi.text)
print(tt)

# Markup that sits between the question text and the answer text.
# The attribute name must be plain ASCII "onclick": a look-alike Greek omicron
# (U+03BF), which some blog platforms substitute when code is pasted, never
# matches real HTML and would leave every entry unsplit.
separator = """</span><span class="table_right"><a href="javascript:;" class="answer" onclick="MM_popupMsg("""

# Iterate over the entries directly instead of keeping a manual index counter.
for entry in tt:
    ttt = entry.split(separator)
    print(ttt)
import re

import requests

# Download every listing page of the brain-teaser section and store one
# "question + answer markup" line per riddle in giao.txt.

# Compiled once because the same pattern is applied to every page. It captures
# everything between the opening of the question span and the "点击显示答案"
# link text of the same <li>.
riddle_pattern = re.compile(""" <li><span class="table_left">(.*)点击显示答案</a></span></li>""")

# Markup that sits between the question text and the answer text.
# The attribute name must be plain ASCII "onclick": a look-alike Greek omicron
# (U+03BF), which some blog platforms substitute when code is pasted, never
# matches real HTML, so no entry would ever be split or written.
separator = """</span><span class="table_right"><a href="javascript:;" class="answer" onclick="MM_popupMsg"""

# The context manager closes the file even if a request fails part-way through;
# an explicit encoding keeps the Chinese text writable regardless of the
# platform's default code page.
with open("giao.txt", "w", encoding="utf-8") as d:
    for page in range(74):
        print("正在下载%d页" % page)
        # Page URLs are built by formatting the page number into the path.
        url = 'https://www.2345.com/inner/jzw/%d.htm' % page
        # A timeout keeps one stalled page from hanging the whole download.
        wang_zhi = requests.get(url, timeout=30)
        tt = riddle_pattern.findall(wang_zhi.text)

        # Iterate over the entries directly: a malformed entry is skipped and
        # the loop moves on, instead of retrying the same index repeatedly.
        for entry in tt:
            ttt = entry.split(separator)
            if len(ttt) < 2:
                # Separator not present, so there is no answer part to pair
                # with the question; drop this entry.
                print("这个问题不要了")
                continue
            d.write(ttt[0] + ttt[1] + "\n")
# 匹配术:正则表达式
# s = "saudhasjkdcsnbuckjlncuhnnasssvcnjsannasssiohvnnafssalsdjvvklnshnnbssbadkijenhueaklrhejhuea"
#
# # Exercise: hide some letters inside the string and find them again using the markers around them: "nn" before and "ss" after.
# import re
# tt = re.findall("nn(.*)ss", s)
# print(tt)
# s = ["张飞","张跑","张跳","张飞","张跑","张跳","张飞","张跑","张跳","张飞","张跑","张跳","张飞","张跑","张跳","张飞","张跑","张跳","张飞","张跑","张跳","张飞","张跑","张跳"]
# # long ---> length 长度
# print(len(s))
# #
# a = 0
# for i in range(len(s)):
# print(s[a])
# a = a + 1
# Demonstration of str.split: cut the string at every occurrence of the
# separator and print the resulting list of pieces.
s = "盗墓笔记鬼吹灯明朝那些事"
separator = "鬼"
tt = str.split(s, separator)
print(tt)
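# xinxin - 爬取脑筋急转弯 (scraping brain teasers)
# 最新推荐文章于 2021-12-06 23:07:28 发布 (blog page footer: latest recommended article published 2021-12-06 23:07:28)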