VHT 是 Vanguard Health Care ETF
用python爬一下ticker
from selenium.webdriver.support import expected_conditions as EC
from selenium.webdriver.common.by import By
from selenium.webdriver.support.wait import WebDriverWait
from selenium import webdriver
from selenium.webdriver.common.keys import Keys
from selenium.webdriver.common.action_chains import ActionChains
import time
from selenium.webdriver.support.ui import Select
import numpy as np
import pandas as pd
import requests
from bs4 import BeautifulSoup
import urllib.request
import re
browser = webdriver.Chrome(executable_path="/Users/xiaoyizhou/Downloads/chromedriver")
browser.get("https://www.zacks.com/funds/etf/VHT/holding")
time.sleep(3)
Select=Select(browser.find_element_by_xpath("/html/body/div[4]/div[3]/div/section[2]/div/div/div[3]/div[2]/label/select"))
Select.select_by_visible_text("100")
soup = BeautifulSoup(browser.page_source, 'html.parser')
Ticker=[]
Symbol=[]
for tr in soup.find_all('tr'):
try:
tds = tr.find_all('td')
if not tds:
pass
else:
Symbol.append(tds[1].text)
except:
pass
Symbol=Symbol[5:len(Symbol)]
Ticker=Ticker+Symbol
next=browser.find_element_by_xpath("/html/body/div[4]/div[3]/div/section[2]/div/div/div[3]/div[3]/a[2]")
time.sleep(3)
next.click()
time.sleep(3)
for i in range(3):
soup = BeautifulSoup(browser.page_source, 'html.parser')
Symbol=[]
for tr in soup.find_all('tr'):
try:
tds = tr.find_all('td')
if not tds:
pass
else:
Symbol.append(tds[1].text)
except:
pass
Symbol=Symbol[5:len(Symbol)]
Ticker=Ticker+Symbol
next=browser.find_element_by_xpath("/html/body/div[4]/div[3]/div/section[2]/div/div/div[3]/div[3]/a[2]")
time.sleep(3)
next.click()
time.sleep(3)
Ticker=pd.DataFrame({'Ticker':Ticker})
Ticker.to_csv("Ticker.csv",index=False)