# 1. 爬虫作业 (web-scraping exercise)
import requests
from re import fullmatch, match, findall
# Page that is scraped for rental listings.
LISTING_URL = 'https://cd.zu.ke.com/zufang'
# Seconds to wait for the server; without a timeout requests can block forever.
REQUEST_TIMEOUT = 10


def extract_listings(html):
    """Extract listing titles, prices and areas from the page HTML.

    The three fields are collected by three independent regex scans over the
    whole document, so each returned list is in document order.

    Args:
        html: The page source as a string.

    Returns:
        A ``(titles, prices, areas)`` tuple of three lists of strings.
        Prices are the digit strings found inside ``<em>...</em>``; areas
        keep their trailing ``㎡`` unit.

    NOTE(review): the lists are not guaranteed to have the same length or to
    line up entry-for-entry if the page contains other ``<em>`` numbers or
    other ``㎡`` values; callers that zip them get truncation to the
    shortest list.
    """
    # Title shape, e.g.:
    #   整租·景茂誉府 1室1厅 东
    #   合租·朝阳名宅 3居室 东北卧
    #   合租·中房优山PLUS 4居室 东卧
    #   合租·黄金时代(中和街道办吉龙二街) 4居室 南卧
    # i.e. a rental-type prefix, a "·" separator, then free text containing
    # Chinese characters, spaces and digits, terminated by the closing `">`.
    titles = findall(r'title="([整合独栋]+租*·.+?)">', html)

    # Price shape: a run of digits wrapped in <em>...</em>.
    prices = findall(r'<em>(\d+?)</em>', html)

    # Area shape: an integer or decimal number immediately followed by ㎡.
    areas = findall(r'\d+\.?\d*㎡', html)

    return titles, prices, areas


if __name__ == '__main__':
    reponse = requests.get(LISTING_URL, timeout=REQUEST_TIMEOUT)
    # Fail loudly on 4xx/5xx instead of scraping an error page.
    reponse.raise_for_status()
    reponse1 = reponse.text

    result, money, area = extract_listings(reponse1)
    for x in zip(result, money, area):
        print(x)