import BookItem
def parse(self, response, **kwargs):
    """Yield the title and publisher of every book table in the response.

    Each ``<table>`` element is treated as one candidate book entry. The
    title is read from the ``title`` attribute of the link inside
    ``div.pl2``; the publisher is taken from the text of ``p.pl``, which is
    split on ``/`` and indexed from the end.

    Args:
        response: Page to scrape. Only ``response.xpath`` is used here, and
            each returned table must offer ``css(...).extract()``.
        **kwargs: Accepted for signature compatibility; unused.

    Yields:
        dict: ``{'title': <str>, 'pub': <str>}`` for every table that has a
        title, an info line, and at least three ``/``-separated fields.
    """
    for table in response.xpath('//table'):
        titles = table.css('div.pl2 a::attr(title)').extract()
        info_lines = table.css('p.pl::text').extract()
        if not titles or not info_lines:
            # Not every <table> is guaranteed to hold a book entry; skip it
            # rather than crash the whole page with an IndexError.
            continue

        fields = info_lines[0].split('/')
        if len(fields) < 3:
            # Too few fields to locate the publisher from the end.
            continue

        # NOTE(review): presumably the info line looks like
        # "author / [translator /] publisher / date / price", which is why
        # the publisher is the third field from the end -- confirm against
        # the target site.
        yield {'title': titles[0], 'pub': fields[-3].strip()}
# items: definition of the scraped item (presumably the project's items.py)
class BookItem(scrapy.Item):
    """Scraped book record with the two fields used elsewhere in this file."""

    # Book title; read as item['title'] when a row is written to result.txt.
    title = scrapy.Field()
    # Publisher name; read as item['pub'] when a row is written to result.txt.
    pub = scrapy.Field()
def process_item(self, item, spider):
    """Append one scraped book to ``result.txt`` as a CSV row and return it.

    NOTE(review): the ``def`` line was missing from the source; the standard
    Scrapy pipeline signature is assumed. This function presumably belongs
    inside the project's pipeline class -- confirm and indent accordingly.

    Args:
        item: Mapping-like item providing the ``'title'`` and ``'pub'`` keys.
        spider: The spider that produced the item; unused.

    Returns:
        The same ``item``, unchanged.

    Raises:
        KeyError: If ``item`` lacks ``'title'`` or ``'pub'``.
    """
    import csv  # local import so this block does not depend on file-level imports

    # The context manager closes the file after each item; newline='' lets the
    # csv writer control line endings itself.
    with open('result.txt', 'a', encoding='utf-8', newline='') as file:
        # csv.writer quotes fields containing commas or quotes, so the file
        # stays a valid two-column CSV for the later pd.read_csv call.
        csv.writer(file, lineterminator='\n').writerow([item['title'], item['pub']])
    return item
# Read the file
# result.txt has no header row, so the two columns are named explicitly.
df = pd.read_csv('result.txt', names=['title', 'pub'])

# Count rows per publisher; value_counts() sorts descending and head() keeps
# the first five entries.
result = df['pub'].value_counts().head()
print(result)

# Pie chart of those counts, labelled by publisher, with each slice's
# percentage shown to one decimal place.
plt.pie(result, labels=result.index, autopct='%3.1f%%')
plt.show()