----------简易爬虫:展示熊猫TV《王者荣耀》(俗称“农药”)主播人气----------
import re
import urllib.request as req
URL = "https://www.panda.tv/cate/kingglory"

# Raw strings: "\w" / "\W" are regex classes, not Python string escapes.
# Greedy on purpose: captures from the first "video-info" div to the last
# closing </div> in the document, i.e. it only trims the page head.
VIDEO_INFO_RE = re.compile(r'<div class="video-info">([\w\W]*)</div>')
# The leading space is part of the original pattern and is kept as-is.
NICKNAME_RE = re.compile(r' <span class="video-nickname" title="([\w\W]*?)">')
VIEWERS_RE = re.compile(r'<span class="video-number">([\w\W]*?)</span>')
# The listing is cut into one fragment per occurrence of this anchor tag.
LABEL_ANCHOR = '<a class="video-label-item label-color-0" href="/cate/kingglory">'


def fetch_page(url=URL, timeout=10):
    """Download *url* and return its body decoded as UTF-8 text.

    The response is closed via the context manager, and *timeout* (seconds)
    keeps a stalled connection from hanging the script forever.
    """
    with req.urlopen(url, timeout=timeout) as response:
        # urlopen yields bytes; they must be decoded before regex matching.
        return str(response.read(), "utf-8")


def parse_viewer_count(text):
    """Convert a viewer-count label such as "8170" or "19.8万" to an int.

    A "万" suffix means the number is expressed in units of ten thousand.
    ``round`` is used instead of ``int`` so binary floating-point error in
    the multiplication cannot truncate the result one below the real value.

    Raises:
        ValueError: if *text* is not a number in one of the two forms.
    """
    text = str(text)
    if "万" in text:
        return round(float(text.replace("万", "")) * 10000)
    return int(text)


def parse_streamers(html):
    """Extract ``(viewers, name)`` tuples from the category page *html*.

    Returns the entries in page order. Fragments that lack either a nickname
    or a viewer count (for example the trailing fragment after the last
    label anchor) are skipped instead of raising IndexError. An empty list
    is returned when the page contains no "video-info" section at all.
    """
    region = VIDEO_INFO_RE.search(html)
    if region is None:
        return []
    streamers = []
    for fragment in region.group(1).split(LABEL_ANCHOR):
        names = NICKNAME_RE.findall(fragment)
        counts = VIEWERS_RE.findall(fragment)
        if not names or not counts:
            continue
        # Only the first name/count of a fragment is used, as before.
        streamers.append((parse_viewer_count(counts[0]), names[0]))
    return streamers


def format_leaderboard(ranked, top=10):
    """Return the report lines for the first *top* entries of *ranked*.

    *ranked* is a sequence of ``(viewers, name)`` tuples already in display
    order. Fewer than *top* entries is fine: only the available rows are
    emitted.
    """
    lines = [
        "=" * 15 + "熊猫直播" + "=" * 15,
        "游戏:王者荣耀",
        "当前人气排行榜TOP10:",
        " 主播 观看人数 ",
    ]
    for rank, (viewers, name) in enumerate(ranked[:top], start=1):
        rank_gap = " " * (2 if rank < 10 else 1)
        # A negative repeat count yields "", so long names simply get no pad.
        name_pad = " " * (15 - len(name))
        lines.append(f"{rank}{rank_gap}{name}{name_pad}{viewers}")
    return lines


def main():
    """Fetch the category page and print the top-10 streamers by viewers."""
    ranked = sorted(parse_streamers(fetch_page()), reverse=True)
    for line in format_leaderboard(ranked):
        print(line)


if __name__ == "__main__":
    main()
-------------------------
C:\Python\Python36\python.exe D:/IdeaProjects/python_basic/extend/learn_reg.py
===============熊猫直播===============
游戏:王者荣耀
当前人气排行榜TOP10:
主播 观看人数
1 柱子z 198000
2 KPL职业联赛 83000
3 我是你绿豆哥哥 33000
4 百星东魔 26000
5 百星小莫 24000
6 熊猫Tv铭记l 13000
7 大师兄yo_ 11000
8 简单点丶无双 8170
9 panda李子 5299
10 有一块朱古力 4953
Process finished with exit code 0
熊猫TV王者荣耀主播人气TOP10
最新推荐文章于 2021-05-18 23:39:12 发布