# Course link (立即学习): https://edu.csdn.net/course/play/6861/326754?utm_source=blogtoedu
# Web-scraping exercise: Red Bull company information (爬虫数据抓取练习-红牛公司信息)
import requests
import re
import bs4
import pandas as pd
# Download the page at `url` and collect, per listed company, its name,
# address, e-mail and phone number into one pandas DataFrame.
url = r'http://www.redbull.com.cn/about/branch'

# requests applies no timeout by default, so bound the wait explicitly, and
# fail loudly on an HTTP error status instead of parsing an error page.
respones = requests.get(url, timeout=10)
respones.raise_for_status()

# Names and addresses are pulled straight out of the raw markup. `.` does not
# match newlines here, so only elements written on a single line are captured.
company = re.findall(r'<h2>(.*?)</h2>', respones.text)
add = re.findall(r"<p class='mapIco'>(.*?)</p>", respones.text)

# Name the parser explicitly: without it bs4 picks whichever parser happens to
# be installed (and warns), so results could differ between machines.
soup = bs4.BeautifulSoup(respones.text, 'html.parser')
mail = [tag.text for tag in soup.find_all(name='p', attrs={'class': 'mailIco'})]
tel = [tag.text for tag in soup.find_all(name='p', attrs={'class': 'telIco'})]

# NOTE(review): pandas raises ValueError if the four lists differ in length,
# e.g. when the page contains an <h2> that is not a company name -- confirm
# against the live page.
# Kept as a bare expression; presumably this ran as a notebook cell, where the
# last expression is displayed. In a plain script the table is discarded.
pd.DataFrame({'company': company, 'add': add, 'mail': mail, 'tel': tel})