小米应用商店的爬虫，提取各个 App 的下载链接。
源码:
# -*- coding: UTF-8 -*-
import requests
import csv
import queue
class XiaoMiShop():
def __init__(self, category):
self.base_url = 'http://app.mi.com/categotyAllListApi'
self.base_download = 'http://app.mi.com/download/'
self.header = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/79.0.3945.88 Safari/537.36'
self.csv_header = ['ID', '应用名称', '下载链接']
self.max_page = 70
self.category = category
self.queue = queue.Queue()
def clean_data(self, data):
'''
提取数据,放入队列中
:param data:
:return:
'''
for i in data:
app = {
}
app['ID'] = i.get