Python学习笔记——20170830

BeautifulSoup

  • 安装
    • 打开cmd命令行
    • pip3 install beautifulsoup4 requests lxml（下面的案例还用到了 requests 库和 'lxml' 解析器，需要一并安装）
  • 案例一
import requests
from bs4 import BeautifulSoup
#
#
def get_html(url, timeout=10):
    """Download *url* and return the page text.

    Args:
        url: Address of the page to fetch.
        timeout: Seconds to wait for the server before giving up.

    Returns:
        The decoded response body when the server answers with status 200.
        Otherwise an error message is printed and None is returned; this
        also covers requests that fail (connection error, timeout, ...).
    """
    try:
        # Without a timeout, requests.get may block forever on a dead host.
        response = requests.get(url, timeout=timeout)
    except requests.RequestException:
        print("网络访问出错")
        return None

    if response.status_code != 200:
        print("网络访问出错")
        return None

    # Decode with the encoding requests detects from the body; only done for
    # successful responses so failed ones skip the detection work.
    response.encoding = response.apparent_encoding
    return response.text
#
#
def parse_html(html):
    """Print a handful of BeautifulSoup lookups for the given HTML text.

    Printed, in order: every ``<a>`` found under the element with id
    ``syncad_1``, the ``<title>`` tag, its string, the first ``<p>`` tag,
    that tag's name, and the name of the first ``<a>`` tag's parent.
    A lookup whose tag is missing from the page prints ``None`` instead of
    raising ``AttributeError``.

    Args:
        html: HTML source text to parse.
    """
    soup = BeautifulSoup(html, 'lxml')

    for link in soup.select('#syncad_1 a'):
        print(link)

    # soup.<tag> is None when the document has no such tag, so every
    # attribute access below is guarded.
    title = soup.title
    print(title)
    print(title.string if title is not None else None)

    first_p = soup.p
    print(first_p)
    print(first_p.name if first_p is not None else None)

    first_a = soup.a
    parent = first_a.parent if first_a is not None else None
    print(parent.name if parent is not None else None)
#
#
if __name__ == "__main__":
    # Script entry point: fetch the Sina news front page and run the
    # BeautifulSoup demo on it.
    page_url = "http://news.sina.com.cn"
    page_source = get_html(page_url)
    # get_html gives back None when the request did not succeed.
    if page_source is not None:
        parse_html(page_source)
  • 案例二
import requests
from bs4 import BeautifulSoup
#
#
def get_html(url, timeout=10):
    """Download *url* and return the page text.

    Args:
        url: Address of the page to fetch.
        timeout: Seconds to wait for the server before giving up.

    Returns:
        The decoded response body when the server answers with status 200.
        Otherwise an error message is printed and None is returned; this
        also covers requests that fail (connection error, timeout, ...).
    """
    try:
        # Without a timeout, requests.get may block forever on a dead host.
        response = requests.get(url, timeout=timeout)
    except requests.RequestException:
        print("网络访问出错")
        return None

    if response.status_code != 200:
        print("网络访问出错")
        return None

    # Decode with the encoding requests detects from the body; only done for
    # successful responses so failed ones skip the detection work.
    response.encoding = response.apparent_encoding
    return response.text
#
#
def parse_html(html):
    """Yield the child count of the first ``<div>``, then each child.

    Args:
        html: HTML source text to parse.

    Yields:
        First the number of direct children of the first ``<div>`` in the
        document, then those children one by one. When the document has no
        ``<div>`` the count is 0 and nothing else is yielded.
    """
    soup = BeautifulSoup(html, 'lxml')
    first_div = soup.div
    if first_div is None:
        # No <div> in the page: report an empty child list instead of
        # failing with AttributeError on None.
        yield 0
        return

    yield len(first_div.contents)
    for child in first_div.children:
        yield child
#
#
if __name__ == "__main__":
    # Script entry point: fetch the Baidu Music front page and print every
    # item produced by parse_html.
    page_url = "http://music.baidu.com"
    page_source = get_html(page_url)
    # get_html gives back None when the request did not succeed.
    if page_source is not None:
        for item in parse_html(page_source):
            print(item)
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值