# xinxin - 爬取脑筋急转弯

import re

import requests

# Single-page experiment: fetch the riddle index page, pull out every riddle
# row with a regular expression, and show how each row splits into the
# question text and the answer fragment.
url = 'https://www.2345.com/inner/jzw/'
wang_zhi = requests.get(url)
print(wang_zhi.text)

# The pattern expects each riddle on its own tab-indented <li> line; the
# capture group keeps everything between the opening question <span> and the
# "点击显示答案" link text. "." does not cross newlines, so one match = one line.
tt = re.findall("""	<li><span class="table_left">(.*)点击显示答案</a></span></li>""", wang_zhi.text)
print(tt)

# Markup that sits between the question and the answer inside a captured row.
# It must spell "onclick" in plain ASCII: the previous separator carried a
# Greek omicron (U+03BF) in place of the Latin "o", so it could never occur in
# real HTML and split() always returned the row unsplit.
separator = """</span><span class="table_right"><a href="javascript:;" class="answer" onclick="MM_popupMsg("""

# Iterate over the rows directly instead of keeping a manual index in step
# with range(len(tt)).
for row in tt:
    ttt = row.split(separator)
    print(ttt)

import re

import requests

# Download the numbered riddle pages and store one "question + answer
# fragment" line per riddle in giao.txt.

# One riddle per tab-indented <li> line; the capture group keeps everything
# between the opening question <span> and the "点击显示答案" link text.
row_pattern = re.compile("""	<li><span class="table_left">(.*)点击显示答案</a></span></li>""")

# Markup that sits between the question and the answer inside a captured row.
# It must spell "onclick" in plain ASCII: the previous separator carried a
# Greek omicron (U+03BF) in place of the Latin "o", so it never matched, every
# row raised IndexError, and the output file stayed empty.
separator = """</span><span class="table_right"><a href="javascript:;" class="answer" onclick="MM_popupMsg"""

# "with" guarantees the file is closed even if a request fails half-way, and
# the explicit encoding keeps the Chinese text writable regardless of the
# platform's default locale encoding.
with open("giao.txt", "w", encoding="utf-8") as d:
    # NOTE(review): numbering starts at 0, so the first request is ".../0.htm";
    # confirm that page exists on the site.
    for page in range(74):
        print("正在下载%d页" % page)
        # %-formatting drops the page number into the URL.
        url = 'https://www.2345.com/inner/jzw/%d.htm' % page
        wang_zhi = requests.get(url)

        tt = row_pattern.findall(wang_zhi.text)

        # Walk the rows directly. The old manual index was only advanced on
        # success, so one malformed row made every remaining iteration of the
        # page retry that same row and skip the rest.
        for row in tt:
            ttt = row.split(separator)
            if len(ttt) < 2:
                # Separator missing: the row does not have the expected
                # question/answer layout, so it is skipped.
                print("这个问题不要了")
                continue
            ttt2 = ttt[0] + ttt[1] + "\n"
            d.write(ttt2)










# 匹配术:正则表达式

# s = "saudhasjkdcsnbuckjlncuhnnasssvcnjsannasssiohvnnafssalsdjvvklnshnnbssbadkijenhueaklrhejhuea"
#
# #写一个字母藏进去,告诉我这个字母前三个字母和后三个字母nn  ss
# import re
# tt = re.findall("nn(.*)ss", s)
# print(tt)

# s = ["张飞","张跑","张跳","张飞","张跑","张跳","张飞","张跑","张跳","张飞","张跑","张跳","张飞","张跑","张跳","张飞","张跑","张跳","张飞","张跑","张跳","张飞","张跑","张跳"]
# # long ---> length 长度
# print(len(s))
# #
# a = 0
# for i in range(len(s)):
#     print(s[a])
#     a = a + 1

# str.split demo: cutting the string at every "鬼" drops the separator itself
# and returns the surrounding pieces as a list.
s = "盗墓笔记鬼吹灯明朝那些事"
tt = s.split(sep="鬼")
print(tt)



  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 1
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论 1
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值