Python3之爬虫中回调函数的简单应用

import re
from multiprocessing import Pool

import requests


# Sample of the anchor markup this pattern is aimed at:
#   <a href="/films/344264" title="战狼2" data-act="boarditem-click" data-val="{movieId:344264}">战狼2</a>
#
# Group 1 captures the text between '}">' and '</a></p>'; group 2 captures
# the body of the '<p class="star">' element that starts on the next line.
# No DOTALL flag is set, so neither group can span a line break.
movie_pattern = re.compile(
    r'}">(.*?)</a></p>\n<p class="star">(.*?)</p>'
)


def get_page(url, timeout=10):
    """Download ``url`` with an HTTP GET and return its text with the URL.

    Args:
        url: Address of the page to fetch.
        timeout: Seconds to wait for the server before giving up. Passed
            straight to ``requests.get``; use ``None`` to wait without limit.

    Returns:
        A dict ``{'url': url, 'res': text}`` where ``text`` is the decoded
        response body.

    Raises:
        requests.exceptions.RequestException: If the request fails,
            including when the timeout expires.
    """
    # requests applies no timeout by default, so an unresponsive server
    # would otherwise block the caller indefinitely.
    res = requests.get(url, timeout=timeout).text
    return {'url': url, 'res': res}


def deal_data(res):
    """Print a fetched page and append its pattern matches to movie_info.txt.

    Args:
        res: Mapping with a ``'url'`` entry and a ``'res'`` entry holding the
            page text to search with ``movie_pattern``.

    Each match is written as one line of the form ``电影:<group 1>,<group 2>``.
    The output file is opened in append mode even when nothing matches.
    """
    page_url, page_text = res['url'], res['res']
    print(page_url, page_text)
    matches = movie_pattern.findall(page_text)
    with open('movie_info.txt', 'a', encoding='utf-8') as out:
        out.writelines(
            '电影:%s,%s\n' % (title, stars) for title, stars in matches
        )


if __name__ == '__main__':
    import sys

    # Board pages to fetch; each one is downloaded by a pool worker.
    urls = [
        'http://maoyan.com/board/7',
        'http://maoyan.com/board/6',
        'http://maoyan.com/board/1',
        'http://maoyan.com/board/2',
        'http://maoyan.com/board/4',
    ]

    def report_failure(exc):
        """Print an exception raised by a pool task to stderr."""
        print('task failed: %r' % (exc,), file=sys.stderr)

    p = Pool(4)
    for url in urls:
        # callback receives get_page's return value on success. Without an
        # error_callback, an exception raised by the task is silently dropped
        # because the AsyncResult is never inspected.
        p.apply_async(
            get_page,
            args=(url,),
            callback=deal_data,
            error_callback=report_failure,
        )

    # Stop accepting new tasks, then wait for the submitted ones to finish.
    p.close()
    p.join()
  • 0
    点赞
  • 1
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值