python csdn增加访问量

python csdn增加访问量

  主方法

# -*- coding:utf-8 -*-
import urllib.request, http.cookiejar, re
import time
import threading
# tools是我的自定义工具类
import tools

'''
模拟访问博客增加访问量
'''


class Csdn(threading.Thread):
    """Worker thread that fetches one article-list page of a CSDN blog and opens every article on it.

    Each instance owns its own cookie-aware opener. The class-level
    ``headers`` list is a shared template and is never mutated; per-user
    headers (the Referer) are added to a copy when an opener is built.
    """
    # Base request headers copied into every opener.
    headers = [('host', 'blog.csdn.net'),
               ('User-Agent',
                'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/45.0.2454.101 Safari/537.36'),
               ]
    domain = 'http://blog.csdn.net'
    # Article-list URL template: (username, page number).
    url = 'http://blog.csdn.net/%s/article/list/%s'

    def __init__(self, username, page):
        """Create a worker for article-list page ``page`` of ``username``'s blog."""
        super().__init__()
        self.username = username
        self.page = page
        self.createOpener()

    @staticmethod
    def _buildOpener(username):
        """Return a new cookie-aware opener carrying the base headers plus a Referer for ``username``."""
        cookieJar = http.cookiejar.CookieJar()
        opener = urllib.request.build_opener(
            urllib.request.HTTPCookieProcessor(cookieJar))
        # Build a fresh list so the shared class-level template is never
        # modified (the previous code appended to it on every call).
        opener.addheaders = Csdn.headers + [
            ('Referer', 'http://blog.csdn.net/' + username)]
        return opener

    @staticmethod
    def getListPages(username):
        """Return the number of article-list pages of ``username``'s blog.

        Fetches list page 1 and reads the total from the pager text.
        If no pager is found in the response, 1 is returned: page 1 was
        fetched successfully, so at least that page exists.
        """
        opener = Csdn._buildOpener(username)
        url = Csdn.url % (username, 1)
        with opener.open(url) as response:
            contents = response.read().decode('utf-8', 'ignore')
        pattern = r'<div id="papelist" class="pagelist">([\s\S]*?)共(\d+)页'
        match = re.search(pattern, contents)
        if match is None:
            return 1
        return int(match.group(2))

    def createOpener(self):
        """Build this worker's private opener and store it in ``self.opener``."""
        self.opener = Csdn._buildOpener(self.username)

    def visitUrl(self):
        """Fetch this worker's list page, keep its HTML in ``self.contents``, then open its articles."""
        url = Csdn.url % (self.username, self.page)
        with self.opener.open(url) as response:
            self.contents = response.read().decode('utf-8', 'ignore')
        self.addVisitNum()

    def addVisitNum(self):
        """Open every article linked from ``self.contents`` and print each visited URL.

        Returns without doing anything when the article-list container
        cannot be located in the page.
        """
        divPattern = r'<div id="article_list" ([\s\S]*)<div id="papelist" class="pagelist">'
        listMatch = re.search(divPattern, self.contents)
        if listMatch is None:
            return
        smallPattern = r'<div class="list_item article_item">([\s\S]*?)<span class="link_title"><a href="(.*?)">([\s\S]*?)</a></span>([\s\S]*?)阅读</a>\((\d+)\)'
        for item in re.findall(smallPattern, listMatch.group(1)):
            # Group index 1 is the article's href, relative to the blog domain.
            articleUrl = Csdn.domain + item[1]
            # Only the request itself matters; close the response right away.
            with self.opener.open(articleUrl):
                pass
            print(self.page, articleUrl)

    def run(self):
        """Thread entry point: process this worker's list page."""
        self.visitUrl()


@tools.runTime
def main():
    """Start one Csdn worker thread per article-list page and wait for all of them."""
    # CSDN user name whose blog is visited
    username = 'digyso888'
    pageCount = Csdn.getListPages(username)
    workers = []
    pageNo = 1
    while pageNo <= pageCount:
        worker = Csdn(username, pageNo)
        worker.start()
        workers.append(worker)
        pageNo += 1
    # Block until every worker has finished
    for worker in workers:
        worker.join()
    print("退出主线程")


# Run main() only when this file is executed as a script, not when it is imported.
if __name__ == '__main__':
    main()


import time

'''
自定义工具方法,tools.py
'''


def runTime(func):
    """Decorator that prints how long each call to ``func`` took.

    The wrapper forwards all positional and keyword arguments, prints the
    elapsed time in seconds after a successful call, and returns the
    wrapped function's result unchanged.
    """
    import functools

    @functools.wraps(func)  # keep the wrapped function's name and docstring
    def newFunc(*args, **kwargs):
        # time.clock() was removed in Python 3.8; perf_counter() is the
        # documented replacement for measuring elapsed intervals.
        start = time.perf_counter()
        res = func(*args, **kwargs)
        end = time.perf_counter()
        print("read: %f s" % (end - start))
        return res

    return newFunc


def log(content, file='test.log', type=1):
    """Write ``content`` to the UTF-8 text file ``file``.

    ``type == 1`` appends to the file; any other value truncates it first.
    The file is closed (and therefore flushed) before the function returns.
    """
    mode = 'a+' if type == 1 else 'w+'
    # The context manager guarantees the handle is closed even if write() fails.
    with open(file, mode, encoding='utf-8') as f:
        f.write(content)


s


  • 0
    点赞
  • 2
    收藏
    觉得还不错? 一键收藏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值