在将数据存入 MySQL 之前,需要先把环境配置好。下面说明 Python 环境下需要安装的包:
mysql安装指南
参考:https://blog.csdn.net/wdh1255/article/details/90695145
需要安装 pymysql
执行:pip install pymysql
import pymysql  # MySQL client driver used for the connection below

# Connection settings are passed by keyword: PyMySQL 1.0+ no longer accepts
# them positionally, so connect("localhost", "root", ...) raises TypeError.
db = pymysql.connect(
    host="localhost",
    user="root",
    password="root",
    database="mysql",
    charset="utf8mb4",  # request a charset that can carry non-ASCII (Chinese) text
)
cursor = db.cursor()

# Drop any table left over from a previous run, then recreate it with three
# fixed-width text columns.
cursor.execute("DROP TABLE IF EXISTS movies")
sql = """CREATE TABLE movies (
file CHAR(200) NOT NULL,
zy CHAR(200),
times CHAR(200) )"""
cursor.execute(sql)
以下是将数据插入数据库:
# Parameterized INSERT: each %s placeholder is filled by the driver from the
# matching element of the values tuple, not by string formatting.
insert_sql = "INSERT INTO movies(file, zy, times)VALUES(%s,%s,%s)"
row_values = (file, zy, times)
cursor.execute(insert_sql, row_values)
db.commit()  # commit so the inserted row is persisted
下面是整个脚本:
from lxml import etree
import requests
import pymysql
# Scrape the Maoyan board page(s) and store one row per listed entry in the
# `movies` table.

# Connection settings are passed by keyword: PyMySQL 1.0+ no longer accepts
# them positionally.
db = pymysql.connect(
    host="localhost",
    user="root",
    password="root",
    database="mysql",
    charset="utf8mb4",  # request a charset that can carry non-ASCII (Chinese) text
)
try:
    with db.cursor() as cursor:
        # Recreate the target table so every run starts from an empty table.
        cursor.execute("DROP TABLE IF EXISTS movies")
        sql = """CREATE TABLE movies (
file CHAR(200) NOT NULL,
zy CHAR(200),
times CHAR(200) )"""
        cursor.execute(sql)

        insert_colmn = "INSERT INTO movies(file, zy, times)VALUES(%s,%s,%s)"
        release_label = "上映时间"

        # range(1) fetches only the first page; the offset advances in steps
        # of 10 (presumably 10 entries per page -- confirm before widening).
        for tb in range(1):
            url = 'https://maoyan.com/board/4?offset={}'.format(tb * 10)
            # A timeout keeps the script from hanging forever, and a non-2xx
            # reply fails loudly instead of silently inserting nothing.
            response = requests.get(url, timeout=10)
            response.raise_for_status()
            s = etree.HTML(response.text)

            # One <dd> node per listed entry.
            entries = s.xpath('//*[@id="app"]/div/div/div[1]/dl/dd')
            for di in entries:
                file = di.xpath('./div/div/div[1]/p[1]/a/@title')[0].strip()
                zy = di.xpath('./div/div/div[1]/p[2]/text()')[0].strip()
                times = di.xpath('./div/div/div[1]/p[3]/text()')[0].strip()
                # Remove the leading label explicitly. str.strip(chars) treats
                # its argument as a set of characters to trim from BOTH ends,
                # not as a prefix. Either colon form is accepted after the
                # label, since the page's exact punctuation is unconfirmed.
                if times.startswith(release_label):
                    times = times[len(release_label):].lstrip("::")
                cursor.execute(insert_colmn, (file, zy, times))

            # Commit once per page rather than once per row.
            db.commit()
finally:
    # Always release the connection, even if a request or insert fails.
    db.close()