import requests
import os
def geturllist(queue):
url = 'https://www.ximalaya.com/revision/play/album?albumId=3423007&pageNum=1&sort=-1&pageSize=30'
headers = {
'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.84 Safari/537.36',
'Referer': 'https://www.ximalaya.com/youshengshu/3423007/',
'Cookie': 'Hm_lvt_4a7d8ec50cfd6af753c4f8aee3425070=1534755334; Hm_lpvt_4a7d8ec50cfd6af753c4f8aee3425070=1534762050',
}
response = requests.get(url, headers=headers)
res_dict = response.json()
# print(res_str)
# print(type(res_str))
for m4a_ob in res_dict['data']['tracksAudioPlay']:
url_m = m4a_ob['src']
# save to queue
queue.put(url_m)
# res_m = requests.get(url=url_m,headers=headers)
# with open('test.m4a','wb') as f:
# f.write(res_m.content)
# break
def download_r(url):
url_m4a = url
headers = {
'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.84 Safari/537.36',
'Referer': 'https://www.ximalaya.com/youshengshu/3423007/',
'Cookie': 'Hm_lvt_4a7d8ec50cfd6af753c4f8aee3425070=1534755334; Hm_lpvt_4a7d8ec50cfd6af753c4f8aee3425070=1534762050',
}
res_m = requests.get(url=url_m4a, headers=headers)
filename = url_m4a.split('/')[-1]
if not os.path.exists('download'):
os.mkdir('download')
with open('download/' + filename, 'wb') as f:
f.write(res_m.content)
if __name__ == '__main__':
from multiprocessing import Queue
from multiprocessing import Pool
import multiprocessing
queue = Queue()
p = multiprocessing.Process(target=geturllist, args=(queue,))
p.start()
download_pool = Pool(5)
for i in range(0, 10):
print(i)
url_m4a = queue.get()
download_pool.apply_async(download_r, (url_m4a,))
download_pool.close()
download_pool.join()
p.join()
利用队列及多进程下载音频文件
最新推荐文章于 2024-04-29 20:19:35 发布