ziheng - 爬取3500道脑筋急转弯

import requests
import re
# Fetch riddle pages 0..73 and print every entry as the list produced by
# splitting the captured markup at the question/answer boundary.
for ye in range(74):
    wang_zhi = "http://www.2345.com/inner/jzw/%d.htm" % ye
    # A timeout keeps one unresponsive page from hanging the whole run.
    yuan_dai_ma = requests.get(wang_zhi, timeout=10)
    # Python data types: dict {}, list [], tuple (), bool True/False, str "", numbers.
    # re.findall(pattern, text) returns the captured group of every match,
    # i.e. the markup between the question span opener and the
    # "show answer" link text.
    wen = re.findall('<li><span class="table_left">(.*)">点击显示答案</a></span></li>', yuan_dai_ma.text)
    for tiao in wen:
        # The separator is spelled with a plain ASCII "onclick"; the
        # look-alike Greek omicron from the pasted version never matches.
        # Element 0 is the text before the separator, element 1 whatever
        # follows the MM_popupMsg(' opener in the captured markup.
        wenti_daan = tiao.split(
            """</span><span class="table_right"><a href="javascript:;" class="answer" onclick="MM_popupMsg('""")
        print(wenti_daan)
import requests
import re

# Fetch riddle pages 0..74 and append every captured entry to jzw.txt,
# one entry per line (each entry is preceded by a newline).
for ye in range(75):
    print("正在下载第%d页" % ye)
    wang_zhi = "http://www.2345.com/inner/jzw/%d.htm" % ye
    # A timeout keeps one unresponsive page from hanging the whole run.
    yuan_dai_ma = requests.get(wang_zhi, timeout=10)
    # Captured group: the markup between the question span opener and the
    # "show answer" link text.
    wen = re.findall('<li><span class="table_left">(.*)">点击显示答案</a></span></li>', yuan_dai_ma.text)
    for tiao in wen:
        # NOTE(review): the raw captured markup is written as-is, so it
        # still contains the HTML between question and answer; the split
        # result was never used by the original and has been dropped.
        try:
            # `with` guarantees the handle is closed even if the write
            # fails; explicit UTF-8 avoids losing entries to a locale
            # codec that cannot encode some characters.
            with open("jzw.txt", "a", encoding="utf-8") as f:
                f.write("\n" + tiao)
        except (OSError, UnicodeError):
            # Best effort: skip an entry that cannot be written and go on.
            print('这个问题我不要了')

评论 1
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值