BeautifulSoup练习-豆瓣活动

from bs4 import BeautifulSoup
import requests
import mysql_test


def space_strip(tag, css):
    """Return the cleaned text of the first element under *tag* matching *css*.

    Newline characters are removed from the element's text and leading and
    trailing whitespace is stripped.

    Args:
        tag: Object exposing ``select(css)`` that returns a sequence of
            elements with a ``text`` attribute (in this file, a
            BeautifulSoup tag).
        css: CSS selector string passed to ``tag.select``.

    Returns:
        The cleaned text of the first match, or an empty string when the
        selector matches nothing.
    """
    matches = tag.select(css)
    if not matches:
        # An entry lacking this element yields '' instead of raising
        # IndexError and aborting the caller's loop.
        return ''
    return matches[0].text.replace('\n', '').strip()


# Fetch the Douban events listing page, extract the fields of every list
# entry, and insert one row per entry into the `douban_act` table.
url = 'https://beijing.douban.com/events/week-party'
# The timeout keeps the script from hanging forever on a stalled connection.
response = requests.get(url, timeout=10)
# Fail fast on an HTTP error status instead of parsing an error page.
response.raise_for_status()

# Uncomment to save a local copy of the fetched page for offline debugging:
# with open('douban_events.html', 'wb') as f:
#     f.write(response.content)

soup = BeautifulSoup(response.text, 'lxml')
ul_tag = soup.find('ul', class_="events-list events-list-pic100 events-list-psmall")
if ul_tag is None:
    # Without this check the next line would fail with an opaque
    # AttributeError on None.
    raise RuntimeError('events list <ul> not found in page: ' + url)
li_list = ul_tag.find_all('li', class_='list-entry')

# The statement text is identical for every row, so it is built once.
sql = 'insert into douban_act (title, date, address, fee, owner) values (%s, %s ,%s ,%s, %s)'
for li_tag in li_list:
    # Each field is the cleaned text of one element inside the entry's
    # `div.title` / `div.info` blocks.
    title = space_strip(li_tag, 'div.title > a > span')
    date = space_strip(li_tag, 'div.info > ul > li')
    address = space_strip(li_tag, 'div.info > ul > li:nth-of-type(2)')
    fee = space_strip(li_tag, 'div.info > ul > li:nth-of-type(3) > strong')
    owner = space_strip(li_tag, 'div.info > ul > li:nth-of-type(4) > a')
    data = (title, date, address, fee, owner)
    # NOTE(review): a fresh mysql_connect() is created for every row, as in
    # the original. Whether a single connection could be reused depends on
    # mysql_test, which is not visible here -- confirm before hoisting.
    mc = mysql_test.mysql_connect()
    mc.mysql_insert_modify(sql, data)

 

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值