不多说，先上勘误后的代码：
# 链家经纪人爬虫实现
import requests
import csv
import time
from lxml import etree
def csv_writer(item):
    """Append one row to ``csvFile/lianjia_broker.csv``.

    Args:
        item: An iterable of field values; it is written as a single CSV
            row via ``csv.writer.writerow``.

    Raises:
        UnicodeEncodeError: If a field contains a character that cannot be
            encoded as GBK (the file is opened with ``encoding='gbk'``).
    """
    # Function-scope import keeps this block self-contained.
    import os

    # Mode 'a' creates the file but not its parent directory, so make sure
    # the directory exists before opening.
    os.makedirs('csvFile', exist_ok=True)
    # newline='' is required by the csv module: without it, platforms that
    # translate '\n' (Windows) emit '\r\r\n' and every record is followed
    # by a blank row.
    with open('csvFile/lianjia_broker.csv', 'a', encoding='gbk',
              newline='') as csvfile:
        csv.writer(csvfile).writerow(item)
def spider(list_url):
headers = {'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
'AppleWebKit/537.36 (KHTML, like Gecko) '
'Chrome/72.0.3626.96 Safari/537.36'}
response = requests.get(list_url, headers=headers)
time.sleep(5)
sel = etree.HTML(response.text)
agent_list = sel.xpath('//li[@class="pictext flexbox '
'box_center_v lazyload_ulog"]/div'
'[@class="post_ulog agent_index&#