#encoding:utf-8
#注意编码格式要为utf-8,否则会编码错误
# Page source of the ranking page. The value below is only a placeholder;
# paste the real HTML here before running the script.
text1 = ''' xxxxx'''

# Markers used to cut the HTML apart.
# NOTE(review): the snippet this script was recovered from had its HTML tags
# stripped and its ASCII quotes replaced by typographic ones. Several split()
# calls were left with an empty separator (which raises
# "ValueError: empty separator") or a truncated one. The tags below are
# reconstructed from the surrounding code -- confirm them against the real
# page markup before relying on the output.
LIST_MARKER = "rank-list-wrap"        # everything before this is discarded
ITEM_END = "</li>"                    # presumably one <li> per ranking entry
RANK_START = 'data-rank="'
TITLE_START = 'title">'
PLAY_START = 'b-icon play"></i>'      # presumably followed by the play count
AUTHOR_START = 'b-icon author"></i>'  # presumably followed by the uploader
GRADE_START = 'pts"><div>'            # presumably followed by the score


def _between(chunk, start, end):
    """Return the text that follows the first *start* in *chunk*, up to *end*.

    If *end* does not occur after *start*, everything after *start* is
    returned.

    Raises:
        ValueError: if *start* does not occur in *chunk*.
    """
    _, found, rest = chunk.partition(start)
    if not found:
        raise ValueError(
            "marker {!r} not found in ranking entry".format(start)
        )
    return rest.partition(end)[0]


def parse_rank_items(html, limit=100):
    """Extract ranking entries from the page source *html*.

    The text before ``LIST_MARKER`` is dropped because it contains markup
    that would confuse the field extraction. The remainder is cut into one
    chunk per entry and at most *limit* chunks are examined.

    Args:
        html: page source as a string.
        limit: maximum number of chunks to examine (the script's original
            hard-coded value was 100).

    Returns:
        A list of ``(rank, title, play_number, author, grade)`` tuples of
        strings, in page order. The list is empty when ``LIST_MARKER`` is
        absent (for example with the placeholder text).

    Raises:
        ValueError: if a chunk carries a rank attribute but lacks one of the
            other field markers.
    """
    _, found, body = html.partition(LIST_MARKER)
    if not found:
        return []

    items = []
    for chunk in body.split(ITEM_END)[:limit]:
        # Chunks without a rank attribute are trailing markup (e.g. whatever
        # follows the last entry), not entries.
        if RANK_START not in chunk:
            continue
        items.append((
            _between(chunk, RANK_START, '"'),
            _between(chunk, TITLE_START, "<"),
            _between(chunk, PLAY_START, "</span>").strip(),
            _between(chunk, AUTHOR_START, "<").strip(),
            _between(chunk, GRADE_START, "<"),
        ))
    return items


for rank, title, play_number, author, grade in parse_rank_items(text1):
    # NOTE: the format string only has placeholders for rank and title; the
    # remaining arguments are accepted by str.format() but not rendered.
    print("排名{},《{}》".format(rank, title, play_number, author, grade))

# The recovered snippet repeated the print statement above and ended with the
# caption "the result is as follows:"; the sample output itself was not
# included.