# Stock information scraper: fetch the stock list, then use that list to fetch detailed information for each individual stock.
import requests
from bs4 import BeautifulSoup
import traceback
import re
import os
import time
'''获取股票信息列表;进而获取个股信息
通过http://quote.eastmoney.com/stock_list.html获取股票信息列表
通过https://www.laohu8.com/stock/600026获取个股信息
'''
''' 通过requests库获取页面信息'''
def getHTMLText(url, code="utf-8", timeout=30):
    """Download a page over HTTP and return its body as text.

    Args:
        url: Address of the page to fetch.
        code: Encoding used to decode the response body.
        timeout: Seconds to wait for the server before giving up, so a
            stalled connection cannot block the caller forever.

    Returns:
        The decoded response text, or "" when the request fails or the
        server answers with an error status.
    """
    try:
        r = requests.get(url, timeout=timeout)
        # Turn 4xx/5xx responses into an exception so they also yield "".
        r.raise_for_status()
        # Set the encoding explicitly before .text decodes the body.
        r.encoding = code
        return r.text
    except requests.RequestException:
        # Only request-level failures are treated as "no content";
        # KeyboardInterrupt and programming errors still propagate.
        return ""
'''获取股票信息列表信息'''
def getStockList(stock_url):
lst = []
html = getHTMLText(stock_url,"GB2312")
soup = BeautifulSoup(html,'html.parser')
a = soup.find_all('a',attrs={'target':'_blank'})
for i in a :
try:
href = re.findall(r"s[hz][0-9]{6}",i[