这里使用的网站是腾讯证券;更详细的版本请参考另一篇爬取雪球网站股票数据的文章。
import bs4
from bs4 import BeautifulSoup
import requests
import re
import pandas as pd
#获取网页源代码
def gethtml(url):
try:
kv = {
'User-Agent':'Mozilla/5.0'}
r = requests.get(url,headers=kv,timeout=30)
r.encoding = 'utf-8'
if r.status_code == 200:
return r.