抖音偷取用户信息

import re
import requests                      # 1. Import modules: re is the standard-library regular-expression module; requests is a third-party HTTP client library (Apache-2.0 licensed)
# Rank-list request URL for one live room, captured from a browser session.
# The string is assembled from adjacent literals (one query parameter per
# line) so individual parameters can be read and diffed; the resulting value
# is a single URL with no added whitespace.
# NOTE(review): msToken / X-Bogus / _signature look like per-request signing
# values copied from the browser — presumably they expire; confirm before
# relying on this URL.
url = (
    'https://live.douyin.com/webcast/ranklist/audience/'
    '?aid=6383'
    '&app_name=douyin_web'
    '&live_id=1'
    '&device_platform=web'
    '&language=zh-CN'
    '&enter_from=web_search'
    '&cookie_enabled=true'
    '&screen_width=1920'
    '&screen_height=1080'
    '&browser_language=zh-CN'
    '&browser_platform=Win32'
    '&browser_name=Edge'
    '&browser_version=113.0.1774.50'
    '&webcast_sdk_version=2450'
    '&room_id=7237816730813336381'
    '&anchor_id=993608293421127'
    '&sec_anchor_id=MS4wLjABAAAA_ob1997uEJAZ51gjn6kN706yOtYggr6FQxBboTbI2pA'
    '&rank_type=30'
    '&msToken=5Cc8kV9KODfPR_jorcxP0nPWxhKUDUjOSVhipckvFtpNydhFmVtBs_S76zWzIgMv7YMRGYTlifdI-kj0TdCiBo5bh3KyRFzPWczIz1KI5FI8j0oUa_FikUqbYGS9lm4='
    '&X-Bogus=DFSzswVYHwzANSpAtS6G45ppgiml'
    '&_signature=_02B4Z6wo000017qkhpwAAIDCT9tsAgpX0j-6pIIAAIrhLNic5Ze2.lFHeKEfsH-xTKzR51UWWVrc6GoFrgM1Iezl.uaKOj34buNoIAmgEXTCNQzrxpA39cm4G42oI9qKCEidNcHveQQO5eV119'
)

import os

# Request headers sent with every HTTP call made by this script.
#
# The previous revision embedded a complete logged-in session cookie here as a
# string literal that was broken across two physical lines, which is a
# SyntaxError. Session cookies are credentials and should not live in source;
# the embedded one also carried a July 2023 date in its sid_guard field, so it
# is presumably expired. The cookie is now taken from the DOUYIN_COOKIE
# environment variable (the raw "name=value; name=value" header string) and is
# simply omitted when that variable is unset or empty.
wz = {
    'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/113.0.0.0 Safari/537.36 Edg/113.0.1774.50',
}

_cookie = os.environ.get('DOUYIN_COOKIE', '').strip()
if _cookie:
    wz['cookie'] = _cookie
# Present the request as coming from a regular desktop browser (via the `wz`
# headers) while fetching pages.
#
# NOTE(review): this script collects account identifiers of live-stream
# viewers. Make sure any use complies with the site's terms of service and
# with applicable privacy law.

# Seconds to wait for a response; requests has no default timeout, so without
# this a stalled connection would block the script indefinitely.
REQUEST_TIMEOUT = 10

PROFILE_URL_PREFIX = 'https://www.douyin.com/user/'

# Patterns are compiled once here instead of on every loop iteration.
SEC_UID_PATTERN = re.compile(r'"sec_uid":"(.*?)","user_role":')
NICKNAME_PATTERN = re.compile(r'<title data-react-helmet="true">(.*?)的主页 - ')
# NOTE(review): this pattern uses ASCII commas; if the live page uses
# full-width punctuation it will never match — verify against a real page.
DOUYIN_ID_PATTERN = re.compile(r'入驻抖音,TA的抖音号是(.*?),已有')


def extract_sec_uids(text: str) -> list:
    """Return every ``sec_uid`` value found in *text*, in order of appearance.

    Only values immediately followed by a ``"user_role"`` key are matched.
    Returns an empty list when nothing matches.
    """
    return SEC_UID_PATTERN.findall(text)


def profile_url(sec_uid: str) -> str:
    """Return the profile page URL for the given ``sec_uid``."""
    return PROFILE_URL_PREFIX + sec_uid


def parse_profile(html: str) -> tuple:
    """Extract nickname and account-id matches from a profile page.

    Returns a ``(nicknames, douyin_ids)`` tuple of lists; either list is
    empty when its pattern does not occur in *html*.
    """
    return NICKNAME_PATTERN.findall(html), DOUYIN_ID_PATTERN.findall(html)


def main() -> None:
    """Fetch the rank list, then print nickname, account id and URL per user.

    Raises:
        requests.RequestException: if the initial rank-list request fails or
            returns an HTTP error status. Failures on individual profile
            pages are reported on stderr and skipped instead.
    """
    import sys

    # 3. Request the URL and get the response.
    res = requests.get(url, headers=wz, timeout=REQUEST_TIMEOUT)
    # Fail loudly on an HTTP error instead of silently matching nothing.
    res.raise_for_status()

    for sec_uid in extract_sec_uids(res.text):
        page = profile_url(sec_uid)
        try:
            profile_res = requests.get(page, headers=wz, timeout=REQUEST_TIMEOUT)
            profile_res.raise_for_status()
        except requests.RequestException as exc:
            # One unreachable profile should not abort the remaining ones.
            print(f'skipped {page}: {exc}', file=sys.stderr)
            continue
        nicknames, douyin_ids = parse_profile(profile_res.text)
        # Printed as match lists, same output shape as before.
        print(nicknames, douyin_ids, page)


if __name__ == '__main__':
    main()
  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 打赏
    打赏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包

打赏作者

顿感小鹿

你的鼓励将是我创作的最大动力

¥1 ¥2 ¥4 ¥6 ¥10 ¥20
扫码支付:¥1
获取中
扫码支付

您的余额不足,请更换扫码支付或充值

打赏作者

实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值