#在网页上爬取json数据
import requests
import json
import pymysql
# Accumulates the movie records appended by the scraping loop below.
moveList = []

# Open the MySQL connection used later to persist the scraped movies.
# NOTE(review): credentials are hard-coded; consider reading them from the
# environment or a config file before using this outside a local demo.
con = pymysql.connect(
    host='127.0.0.1',  # host name
    port=3306,
    user='root',
    password='root',
    charset='utf8',
    # `database` is the supported keyword; `db` is only a deprecated alias.
    database='homework',
)
# Scrape the JSON search results: two requests, with page_start advancing by
# 20 to match the page_limit=20 in the query string.
for page in range(2):
    url = "https://movie.douban.com/j/search_subjects?type=movie&tag=%E7%83%AD%E9%97%A8&sort=recommend&page_limit=20&page_start={}".format(page * 20)
    print(url)
    # Without a timeout requests may block forever on a stalled connection.
    response = requests.get(url, timeout=10)
    # Fail loudly on HTTP errors instead of trying to parse an error page.
    response.raise_for_status()
    data = response.text
    # "subjects" may be missing or null in the payload; treat that as an
    # empty page rather than crashing while iterating over None.
    moveList.extend(json.loads(data).get("subjects") or [])
print(moveList)
# Persist the scraped movies into the `movies` table.
# The placeholders are intentionally unquoted: the values are passed to the
# driver separately so it escapes them itself. Building the statement with
# string formatting would break on any title containing a quote and would let
# scraped (untrusted) text inject SQL.
sql = "insert into movies(title,url,cover) values(%s,%s,%s)"
try:
    # The cursor is closed automatically when the `with` block exits.
    with con.cursor() as cursor:
        cursor.executemany(
            sql,
            [(ele['title'], ele['url'], ele['cover']) for ele in moveList],
        )
    # Commit once, after every row was inserted successfully.
    con.commit()
finally:
    # Always release the connection, even if an insert raised.
    con.close()
# Web crawler demo built with the Django framework: https://download.csdn.net/download/hi_sir_destroy/11388170