监控证监会公告、证监会令、证券业协会自律规则更新信息,通过企业微信机器人推送最新内容到终端。
源代码如下:
from bs4 import BeautifulSoup
from selenium import webdriver
from selenium.webdriver.chrome.options import Options
import requests
import re
import time
import os
class CsrcSpider(object):
def __init__(self, *arg):
    """Set up a scraper for one page of the CSRC website.

    Args:
        *arg: Positional arguments; only the first one is read. It is
            converted with ``str()`` and appended to
            ``http://www.csrc.gov.cn/`` to form the page URL. Calling
            with no arguments raises ``IndexError``.

    Side effects:
        Creates a Chrome webdriver configured with ``--headless``,
        using the driver binary at ``../file/chromedriver.exe``
        (relative to the current working directory).
    """
    # Build the target URL first so that a missing argument fails
    # before any browser process is started.
    section = str(arg[0])
    self.url = 'http://www.csrc.gov.cn/' + section

    # Headless Chrome session.
    # NOTE(review): `executable_path` is deprecated in Selenium 4 in
    # favour of a Service object - confirm the installed version.
    headless = Options()
    headless.add_argument('--headless')
    self.chrome_options = headless
    self.driver = webdriver.Chrome(
        options=headless,
        executable_path='../file/chromedriver.exe',
    )

    # Absolute prefix; presumably joined with the relative part captured
    # by `p_href` to build full document links - verify against callers.
    self.pre_href = 'http://www.csrc.gov.cn/pub/zjhpublic/'

    # Regex sources applied to the page HTML. `p_href` captures the
    # link target following the leading "../../"; `p_title` captures
    # the anchor text of those same links.
    self.p_href, self.p_title = (
        '<a href="../../(.*?)"',
        '<a href="../../.*?target="_blank.*?">(.*?)</a>',
    )

    # Capture the inner text of the <li class="fbrq"> and
    # <li class="wh"> items (presumably publication date and document
    # number - TODO confirm).
    self.p_fbrq, self.p_wh = (
        '<li class="fbrq" title=".*?">(.*?)</li>',
        '<li class="wh" title=".*?">(.*?)</li>',
    )

    # Starts empty; presumably remembers the most recently seen title so
    # that only new items are pushed - verify against the polling code.
    self.lasttitle = ''

    # Fixed image URL; presumably the picture shown in the pushed
    # message card - TODO confirm.
    self.picurl = 'https://timgsa.baidu.com/timg?image&quality=80&size=b9999_10000&sec=1591000028969&di=fcff5ed28372c20a919cdbdba509febf&imgtype=0&src=http%3A%2F%2Fg.hiphotos.baidu.com%2Fbaike%2Fpic%2Fitem%2F08f790529822720e82e8705071cb0a46f21fab72.jpg'
def get_url(self):
self.driver.get(self