用requests库爬取图片
Requests 库 爬取图片
import os

import requests

# Download one image over HTTP and store it under `root`, using the last
# path segment of the URL as the file name. If the target file is already
# present, nothing is fetched.
url = 'https://i0.hdslb.com/bfs/album/eddabcad0e7a8a6dc433ddd406d8b993327250c2.jpg@518w_1e_1c.jpg'
root = '/home/rcx/图片/'
path = root + url.split('/')[-1]

try:
    # exist_ok removes the check-then-create race; makedirs also creates
    # any missing parent directories.
    os.makedirs(root, exist_ok=True)
    if not os.path.exists(path):
        # A timeout keeps the script from hanging on an unresponsive server.
        r = requests.get(url, timeout=10)
        # Raise on 4xx/5xx so an error page is never written out as an image.
        r.raise_for_status()
        # The with-statement closes the file; no explicit close() is needed.
        with open(path, 'wb') as f:
            f.write(r.content)
        print('图片爬取成功')
    else:
        print('文件已存在')
except (requests.RequestException, OSError):
    # Only network/HTTP and filesystem errors are reported as a failed
    # download; KeyboardInterrupt and programming errors still propagate.
    print('图片爬取失败')
百度搜索 关键字接口
import requests
# Send `keyword` to Baidu's search endpoint as the `wd` query parameter,
# then print the final request URL and the length of the response text.
keyword = 'Python'
try:
    kv = {'wd': keyword}
    # requests encodes `params` into the query string; the timeout keeps the
    # script from blocking forever if the server does not answer.
    r = requests.get('http://www.baidu.com/s', params=kv, timeout=10)
    print(r.request.url)
    r.raise_for_status()
    print(len(r.text))
except requests.RequestException:
    # Covers connection errors, timeouts and the HTTPError raised by
    # raise_for_status(); unrelated exceptions are no longer swallowed.
    print('爬取失败')
ip地址
www.ip138.com
import requests

# Fetch the ip138 lookup page for one IP address and print the last
# 500 characters of the response body.
# NOTE(review): presumably the browser-like User-Agent is there because the
# site rejects the default python-requests one - confirm.
headers = {'user-agent': 'Mozilla/5.0'}
ipaddress = '111.37.244.56'
root = 'http://m.ip138.com/ip.asp?ip='
url = root + ipaddress

try:
    # The timeout keeps the script from hanging on an unresponsive server.
    r = requests.get(url, headers=headers, timeout=10)
    r.raise_for_status()
    # Decode the body with the encoding detected from its content rather
    # than the one derived from the HTTP headers.
    r.encoding = r.apparent_encoding
    print(r.text[-500:])
except requests.RequestException:
    # Covers connection errors, timeouts and HTTP error statuses; other
    # exceptions (e.g. KeyboardInterrupt) propagate instead of being hidden.
    print('ip爬取失败')