import requests
# Fetch a JD product page while sending a desktop-browser User-Agent header,
# then print the HTTP status code followed by the complete response body.
browser_headers = {
    'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/110.0.0.0 Safari/537.36 Edg/110.0.1587.49',
}
response = requests.get(
    "https://item.jd.com/100041239020.html",
    headers=browser_headers,
)
print(response.status_code)
print(response.text)
![](https://i-blog.csdnimg.cn/blog_migrate/be69b2338afb556c83ddecd87f1cddcd.jpeg)
import requests
# Fetch a JD product page with a browser User-Agent and print the status code
# plus the first 1000 characters of the body; print a failure message when the
# request itself fails.
kv = {'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/110.0.0.0 Safari/537.36 Edg/110.0.1587.49'}
url = 'https://item.jd.com/100041239020.html'
try:
    # Without a timeout, requests can wait indefinitely on a stalled server.
    r = requests.get(url, headers=kv, timeout=10)
    # Convert 4xx/5xx responses into an exception so they reach the handler.
    r.raise_for_status()
except requests.RequestException:
    # Only network/HTTP failures are reported; Ctrl-C and real bugs propagate.
    print("爬取失败")
else:
    # Decode using the encoding detected from the body content.
    r.encoding = r.apparent_encoding
    print(r.status_code)
    print(r.text[:1000])
![](https://i-blog.csdnimg.cn/blog_migrate/0814e360a3cd618b71541451ca318800.jpeg)
import requests
# Request an Amazon product page with NO custom headers and without calling
# raise_for_status(), so whatever status code and body the server returns are
# printed as-is. The header dict below is intentionally left disabled.
# kv={'user-agent':'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/110.0.0.0 Safari/537.36 Edg/110.0.1587.49'}
url = 'https://www.amazon.cn/dp/B0BX5R554N/'
try:
    # Without a timeout, requests can wait indefinitely on a stalled server.
    r = requests.get(url, timeout=10)
except requests.RequestException:
    # Only connection-level failures end up here, since HTTP error statuses
    # are not turned into exceptions in this snippet.
    print("爬取失败")
else:
    # r.raise_for_status()  # left disabled so error responses are still printed
    # Decode using the encoding detected from the body content.
    r.encoding = r.apparent_encoding
    print(r.status_code)
    print(r.text[:1000])
![](https://i-blog.csdnimg.cn/blog_migrate/5c3fa334ce094b02dbe9b3b72fa26730.jpeg)
![](https://i-blog.csdnimg.cn/blog_migrate/b427dcf91eb4d8f4150bb750e74c1c89.jpeg)
import requests
# Request an Amazon product page with a browser User-Agent, then print the
# status code, the headers that were actually sent, and the first 1000
# characters of the body.
kv = {'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/110.0.0.0 Safari/537.36 Edg/110.0.1587.49'}
url = 'https://www.amazon.cn/dp/B0BX5R554N/'
try:
    # Without a timeout, requests can wait indefinitely on a stalled server.
    r = requests.get(url, headers=kv, timeout=10)
    # Convert 4xx/5xx responses into an exception so they reach the handler.
    r.raise_for_status()
except requests.RequestException:
    # Only network/HTTP failures are reported; Ctrl-C and real bugs propagate.
    print("爬取失败")
else:
    # r.encoding=r.apparent_encoding  # left disabled: the default encoding is used here
    print(r.status_code)
    # Shows the outgoing request headers, including the overridden User-Agent.
    print(r.request.headers)
    print(r.text[:1000])
![](https://i-blog.csdnimg.cn/blog_migrate/8cf9bd79cc5bd1c4a5b11062738080c5.jpeg)
import requests
# Download a single image and store its raw bytes at a fixed local path.
path = "E:\\re\\abc.jpg"
hd = {'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/110.0.0.0 Safari/537.36 Edg/110.0.1587.49'}
url = 'http://img0.dili360.com/pic/2020/01/06/5e130172402b79y44941505_t.jpg@!rw9'
try:
    # Without a timeout, requests can wait indefinitely on a stalled server.
    r = requests.get(url, headers=hd, timeout=10)
    # Convert 4xx/5xx responses into an exception so no error page is saved.
    r.raise_for_status()
    print(r.status_code)
    # r.content is the undecoded body, so the file is opened in binary mode.
    # The with-statement closes the file on exit; no explicit close() needed.
    with open(path, 'wb') as f:
        f.write(r.content)
except (requests.RequestException, OSError):
    # Network/HTTP failures and file-system failures (e.g. the target folder
    # does not exist) are both reported as a failed download.
    print("爬取失败")
![](https://i-blog.csdnimg.cn/blog_migrate/58aec9f9e4cbb2d909c220e875f83c0e.jpeg)
![](https://i-blog.csdnimg.cn/blog_migrate/52bc4b59a68143415603d868a548d125.jpeg)
百度搜索:爬取不成功。
# https://www.baidu.com/s?wd=keyword
# https://www.baidu.com/s?ie=utf-8&f=3&rsv_bp=1&rsv_idx=1&tn=baidu&wd=%E4%B8%AD%E5%9B%BD
# https://www.so.com/s?q=keyword
import requests
# Submit a keyword search to Baidu and print the status code, the final
# request URL, and the first 1000 characters of the response.
# All query-string fields live in `kv` so that requests builds and encodes the
# whole query; the previous URL ended in '&', which produced '&&wd=...'.
kv = {
    'ie': 'utf-8',
    'f': '3',
    'rsv_bp': '1',
    'rsv_idx': '1',
    'tn': 'baidu',
    'wd': '泰国',
}
hd = {'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/110.0.0.0 Safari/537.36 Edg/110.0.1587.49'}
url = 'https://www.baidu.com/s'
try:
    # Without a timeout, requests can wait indefinitely on a stalled server.
    r = requests.get(url, params=kv, headers=hd, timeout=10)
    # Convert 4xx/5xx responses into an exception so they reach the handler.
    r.raise_for_status()
except requests.RequestException:
    # Only network/HTTP failures are reported; Ctrl-C and real bugs propagate.
    print("爬取失败")
else:
    # Decode using the encoding detected from the body content.
    r.encoding = r.apparent_encoding
    print(r.status_code)
    # The URL actually sent, with the percent-encoded query string appended.
    print(r.request.url)
    print(r.text[:1000])
结果:百度会要求验证,因此爬取不成功。
![](https://i-blog.csdnimg.cn/blog_migrate/8f2c2e649d5cd480f63c845b858e055c.jpeg)
![](https://i-blog.csdnimg.cn/blog_migrate/f5d3a4e70b8380585c6963d48403e1ca.jpeg)
import requests
# Look up an IP address on ipshudi.com and print the status code plus
# characters 1500-3000 of the returned page.
hd = {'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/110.0.0.0 Safari/537.36 Edg/110.0.1587.49'}
ip = '112.96.59.100'
# The site addresses each lookup page as /<ip>.htm.
url = f'https://www.ipshudi.com/{ip}.htm'
try:
    # Without a timeout, requests can wait indefinitely on a stalled server.
    r = requests.get(url, headers=hd, timeout=10)
    # Convert 4xx/5xx responses into an exception so they reach the handler.
    r.raise_for_status()
except requests.RequestException:
    # Only network/HTTP failures are reported; Ctrl-C and real bugs propagate.
    print("爬取失败")
else:
    print(r.status_code)
    # Print only a middle slice of the page rather than the whole document.
    print(r.text[1500:3000])
![](https://i-blog.csdnimg.cn/blog_migrate/06d6749ae64db464a3860ba644a2c042.jpeg)
import requests
# Submit a keyword search to so.com and print the status code, the final
# request URL, and the first 1000 characters of the response.
kv = {'q': '泰国'}
hd = {'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/110.0.0.0 Safari/537.36 Edg/110.0.1587.49'}
url = 'https://www.so.com/s'
try:
    # Without a timeout, requests can wait indefinitely on a stalled server.
    r = requests.get(url, params=kv, headers=hd, timeout=10)
    # Convert 4xx/5xx responses into an exception so they reach the handler.
    r.raise_for_status()
except requests.RequestException:
    # Only network/HTTP failures are reported; Ctrl-C and real bugs propagate.
    print("爬取失败")
else:
    # Decode using the encoding detected from the body content.
    r.encoding = r.apparent_encoding
    print(r.status_code)
    # The URL actually sent, with the percent-encoded query string appended.
    print(r.request.url)
    print(r.text[:1000])
![](https://i-blog.csdnimg.cn/blog_migrate/a87e8f3334c2ae056da6d80762795482.jpeg)
![](https://i-blog.csdnimg.cn/blog_migrate/b54bf97010ee5241e0f78e05731cead8.jpeg)