2021-02-28

最新推荐文章于 2022-09-17 12:52:27 发布

阿凌sara

最新推荐文章于 2022-09-17 12:52:27 发布

阅读量405

点赞数

分类专栏： python 反爬

本文链接：https://blog.csdn.net/qq_44911774/article/details/114240114

版权

python 反爬专栏收录该内容

5 篇文章 0 订阅

订阅专栏

中医智库

接口：https://www.zk120.com/ji/read/529?nav=ys&uid=None

代码

# import requests
# source = requests.get('https://www.zk120.com/ji/content/529?uid=None&_=1614130155981').json()
# print(source)

#_*_coding:utf-8_*_
import requests
from lxml.html import etree
import json
import base64
import pyaes
import zlib
# pip install pycryptodome
from Crypto.Cipher import AES
from binascii import b2a_hex, a2b_hex
# Crawl the zk120.com book index: walk every group page linked from the
# index, fetch each book's encrypted content endpoint, decrypt and
# decompress the payload, and print the book text to stdout.

# Site root; every href scraped below is appended to it.
BASE_URL = 'https://www.zk120.com'
# Seconds to wait on each HTTP request. Without a timeout, requests blocks
# indefinitely when the server stops responding.
REQUEST_TIMEOUT = 30
# The key is 24 bytes long, so the cipher runs as AES-192 (valid AES key
# lengths are 16, 24 or 32 bytes). The IV is one 16-byte AES block.
AES_KEY = b"61581af471b166682a37efe6"
AES_IV = b"c8f203fca312aaab"

url = BASE_URL + '/ji/group/?nav=ahz'
index_response = requests.get(url, timeout=REQUEST_TIMEOUT)
# Fail loudly on an HTTP error instead of parsing an error page.
index_response.raise_for_status()
index_page = etree.HTML(index_response.text)
group_hrefs = index_page.xpath("//a[@class='ellipsis']/@href")

for group_href in group_hrefs:
    # Only links containing 'group' are followed as group pages.
    if 'group' not in group_href:
        continue

    group_response = requests.get(BASE_URL + group_href, timeout=REQUEST_TIMEOUT)
    group_response.raise_for_status()
    group_page = etree.HTML(group_response.text)
    read_hrefs = group_page.xpath("//a[@class='mr5 native_read to_reader_url']/@href")

    for read_href in read_hrefs:
        # The reader page lives under .../read/...; swapping 'read' for
        # 'content' gives the URL that is requested for the JSON payload.
        content_url = BASE_URL + read_href.replace('read', 'content')
        content_response = requests.get(content_url, timeout=REQUEST_TIMEOUT)
        content_response.raise_for_status()

        # The endpoint returns JSON; its 'data' field is base64 text.
        payload = json.loads(content_response.text)
        ciphertext = base64.b64decode(payload['data'].encode('utf-8'))

        # A fresh cipher object is created per book, as in the original
        # flow, so every payload is decrypted starting from AES_IV.
        decryptor = AES.new(AES_KEY, AES.MODE_CFB, AES_IV, segment_size=128)
        compressed = decryptor.decrypt(ciphertext)

        # The decrypted bytes are zlib-compressed JSON; the book text is
        # stored under the 'text' key.
        book = json.loads(zlib.decompress(compressed))

        # Encoding with errors='ignore' and decoding again drops any
        # characters that cannot be represented in UTF-8 before printing.
        text_code = book.get("text").encode("utf-8", "ignore")
        print(str(text_code, encoding='utf-8'))

            # with open('zhongyi.txt', 'a+', encoding='utf-8') as f:
            #     f.write(str(text_code, encoding='utf-8'))



                     # 'https://www.zk120.com/ji/content/529?uid=None&_=1523528905719'
            #
            # 'https://www.zk120.com/ji/read/529?nav=ahz&uid=None'


        # ur = 'https://www.zk120.com'+'/ji/read/529?nav=ahz&amp;uid=None'
        # print(ur)