import csv
import os
import re
import pandas as pd
import requests
import random
import time
import json
from pymysql import *
from lxml import etree
from sqlalchemy import create_engine
from datetime import datetime, timedelta
# Module-level SQLAlchemy engine for the `doubanmovie` MySQL database on
# localhost:3306, using the PyMySQL driver (per the URL scheme below).
# NOTE(review): the user name and password are embedded in the URL literal;
# consider loading them from configuration or the environment instead.
engine = create_engine(
    'mysql+pymysql://root:root@localhost:3306/doubanmovie'
)
class spider(object):
def init(self):
try:
conn = connect(host='localhost', user='root', password='root', database='doubanmovie', port=3306, charset='utf8mb4')
sql = '''
create table movies(
id int primary key auto_increment,
directors varchar(2555),
rate varchar(255),
title varchar(255),
casts varchar(255),
cover varchar(255),
year varchar(255),
types varchar(255),
country varchar(255),
lang varchar(255),
time varchar(255),
movieTime varchar(255),
comment_len varchar(255),
starts varchar(255),
summary varchar(2555),
comments text,
imgList varchar(2555),
movieUrl varchar(255),
detailLink varchar(255)