##################
# -*- coding: utf-8 -*-
####@author: Conan_ft 2021.11.28
import requests
import bs4
from bs4 import BeautifulSoup
# HTTP request headers sent with every page download; the User-Agent
# string identifies the client as a desktop Chrome browser.
header = {
    'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/96.0.4664.55 Safari/537.36',
}
# init_page = requests.get(url, headers=header).content
def get_one_page(url):
    """Download one listing page and extract the text fields of each card.

    Args:
        url: Full URL of the page to fetch.

    Returns:
        A list with one ``[description, location, price]`` entry for every
        ``div`` of class ``shell-resblock-card`` found in the page. Each
        field is the text of the matching element inside the card, or ``''``
        when the card does not contain that element.

    Raises:
        requests.exceptions.RequestException: If the download fails or
            does not complete within the timeout.
    """
    # Without a timeout a stalled connection would block the scrape forever.
    res = requests.get(url, headers=header, timeout=30)
    soup = BeautifulSoup(res.text, 'html.parser')

    def text_of(tag):
        # find() returns None when nothing matches; map that to an empty
        # field so one incomplete card does not abort the whole page.
        return tag.text if tag is not None else ''

    result = []
    for card in soup.find_all('div', attrs={'class': 'shell-resblock-card'}):
        description = text_of(card.find('h2'))
        location = text_of(card.find('div', attrs={'class': 'location'}))
        # Explicit class filter, consistent with the other selectors
        # (BeautifulSoup treats a non-dict ``attrs`` as a class match).
        price = text_of(card.find('div', attrs={'class': 'price'}))
        result.append([description, location, price])
    return result
# Base URL of the paginated listing; the page number is appended to it.
url = 'https://m.lianjia.com/cd/loupan/fang/gaoxin7/pg'

# Gather the rows of pages 1 through 7 into one flat list.
h_info = []
for page in range(1, 8):
    h_info.extend(get_one_page(url + str(page)))
    print(page, 'done')

# One output line per listing: every field is followed by a space and a tab,
# and each line ends with a newline.
o = ''.join(
    ''.join(str(field) + ' ' + '\t' for field in row) + '\n'
    for row in h_info
)

# The context manager guarantees the file is closed even if the write fails.
with open('/Users/Conan/Desktop/study/python_deal/lianjia_cd.txt', 'w', encoding='utf-8') as f:
    f.write(o)