Python后台抓取,C#客户端展示
待抓取网站及数据内容如下:
东方财富网
http://emweb.securities.eastmoney.com/CoreConception/Index?type=web&code=sh601390
下的核心题材
http://emweb.securities.eastmoney.com/ShareholderResearch/Index?type=web&code=SH601390#
股东研究 下的 十大流通股东、十大股东
同花顺
http://basic.10jqka.com.cn/601390/company.html
公司资料 下的 参股控股公司
http://basic.10jqka.com.cn/601390/concept.html
概念题材下的 常规题材、新兴概念、其他概念、题材要点
import baostock as bs
import pandas as pd
from urllib.request import urlopen
from bs4 import BeautifulSoup
from selenium import webdriver
from selenium.webdriver.common.by import By
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC
from selenium.webdriver.common.desired_capabilities import DesiredCapabilities
from phantomjs_bin import executable_path
import time
from datetime import timedelta, datetime
import ctypes
import sqlite3
import traceback
import os
# Print the path of the current working directory.
print(os.getcwd())

# Browser request header: start from a shallow copy of the stock PhantomJS
# capabilities and set the user-agent entry to an Android Chrome string.
dcap = {
    **DesiredCapabilities.PHANTOMJS,
    "phantomjs.page.settings.userAgent": "Mozilla/5.0 (Linux; Android 5.1.1; Nexus 6 Build/LYZ28E) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/48.0.2564.23 Mobile Safari/537.36",
}

# Module-level PhantomJS driver, launched from the binary path supplied by
# phantomjs_bin and configured with the capabilities built above.
driver = webdriver.PhantomJS(
    desired_capabilities=dcap,
    executable_path=executable_path,
)
def main():
conn = sqlite3.connect('stockInfo.db')
c = conn.cursor()
stockName = "永泰能源"
stockCode='600157'
insertData=getWebData(stockCode)
try:
#raise TypeError('类型错误')
sqltext="INSERT INTO '" + stockName + "(" + stockCode + ")' (dfcfHxtc,dfcfSdl