爬虫之淘宝抓包法
案例一(数据格式处理)
import urllib.request
#url = 'https://image.baidu.com/search/detail?ct=503316480&z=0&ipn=d&word=%E9%9F%A9%E5%95%86%E8%A8%80%E5%A3%81%E7%BA%B8&hs=2&pn=0&spn=0&di=41910&pi=0&rn=1&tn=baiduimagedetail&is=0%2C0&ie=utf-8&oe=utf-8&cl=2&lm=-1&cs=1904897900%2C1084212529&os=2553811481%2C1788484320&simid=3433783175%2C509998897&adpicid=0&lpn=0&ln=30&fr=ala&fm=&sme=&cg=&bdtype=0&oriquery=%E9%9F%A9%E5%95%86%E8%A8%80%E5%A3%81%E7%BA%B8&objurl=http%3A%2F%2Fimgboys1.yohobuy.com%2Fcmsimg01%2F2018%2F12%2F03%2F09%2F31%2F01edc98fd3de8e80ba1cdb9becfe372254.jpeg&fromurl=ippr_z2C%24qAzdH3FAzdH3Fooo_z%26e3By5i5k7y_z%26e3Bv54AzdH3F27wg2AzdH3FgjofAzdH3Fl80b8_mla8n_8_z%26e3Bip4s&gsm=0&islist=&querylist='
# Taobao suggestion endpoint (suggest.taobao.com/sug); the `q` parameter
# carries the percent-encoded search text.
url='https://suggest.taobao.com/sug?area=b2c&code=utf-8&k=1&src=tmall_h5&q=%E8%A1%AC%E8%A1%AB%E5%A5%B3%E7%9F%AD%E8%A2%96%20%E6%A3%89%E9%BA%BB'
# Open the URL inside a `with` block so the HTTP response is always closed,
# even if reading or decoding raises.
with urllib.request.urlopen(url) as response:
    # read() returns raw bytes; decode them as UTF-8 (the URL asks for
    # code=utf-8) to get the body as text.
    html = response.read().decode('utf-8')
# Bare expression: displays the decoded text only when run in an interactive
# session (REPL / notebook cell); it has no effect in a plain script.
html
运行结果如下:
import requests
# Issue a GET request for the same `url` using the third-party `requests`
# library; `strhtml` is bound to whatever requests.get returns (the response
# object, not yet the body text).
strhtml=requests.get(url)
# NOTE(review): as written, this bare `print` is just a name expression and
# outputs nothing. The line looks truncated — presumably it was meant to print
# the response (e.g. its text); confirm against the original article.
print