import pandas as pd
# In a DataFrame, `index` holds the row labels and `columns` the column labels.
# Use Unicode East Asian Width when computing display widths so that printed
# columns stay aligned when cells contain wide characters.
pd.set_option('display.unicode.east_asian_width', True)

# Pages to scrape: the landing page plus the explicitly numbered pages 0-12.
# NOTE(review): the landing page, page/0 and page/1 may all serve the same
# first page of results, which would duplicate rows — confirm against the
# site and trim the range if so.
url_List = ['http://www.espn.com/nba/salaries/_/seasontype/4']
url_List.extend(
    'http://www.espn.com/nba/salaries/_/page/%s/seasontype/4' % page
    for page in range(0, 13)
)

# Gather every <table> parsed from every page first and concatenate once.
# DataFrame.append was removed in pandas 2.0, and growing a frame inside the
# loop re-copies all previously accumulated rows on each iteration.
tables = []
for url in url_List:
    # read_html returns a list with one DataFrame per <table> on the page.
    tables.extend(pd.read_html(url))

# Stack all parsed tables into a single frame with a fresh 0..n-1 row index.
# NOTE(review): the tables are read without a header row, so the site's
# "RK NAME TEAM SALARY" line is kept as an ordinary data row — filter it out
# before doing any numeric work on the result.
df = pd.concat(tables, ignore_index=True) if tables else pd.DataFrame()
print(df)
运行结果:
H:\pythonProject\venv\Scripts\python.exe H:/pythonProject/main.py
0 1 2 3
0 RK NAME TEAM SALARY
1 1 Stephen Curry, PG Golden State Warriors $45,780,966
2 2 James Harden, SG Brooklyn Nets $44,310,840
3 3 John Wall, PG Houston Rockets $44,310,840
4 4 Russell Westbrook, PG Los Angeles Lakers $44,211,146
.. ... ... ... ...
611 476 Miles McBride, PG New York Knicks $925,258
612 477 Georgios Kalaitzakis, SF Milwaukee Bucks $925,258
613 478 Brandon Boston Jr., SG LA Clippers $925,258
614 479 Luka Garza, C Detroit Pistons $925,258
615 480 Marko Simonovic, C Chicago Bulls $925,258
[616 rows x 4 columns]
进程已结束,退出代码为 0