python selenium爬虫豆瓣_Python每日一题：使用Selenium爬取豆瓣电影信息

最新推荐文章于 2024-04-04 00:57:56 发布

weixin_39752087

最新推荐文章于 2024-04-04 00:57:56 发布

阅读量236

点赞数

文章标签： python selenium爬虫豆瓣

本文链接：https://blog.csdn.net/weixin_39752087/article/details/111756991

版权

#from bs4 import BeautifulSoup

import re, csv, urllib.request, urllib.parse, time, json, pickle,random

from selenium import webdriver

from selenium.webdriver.common.keys import Keys

from selenium.webdriver.common.by import By

from selenium.webdriver.support.ui import WebDriverWait

from selenium.webdriver.support import expected_conditions as EC

class managerurl(object):
    """Keep track of URLs still to be crawled and URLs already handed out.

    ``newurls`` holds URLs that have been queued but not yet returned by
    ``has_newurls``; ``oldurls`` holds every URL that has been returned.
    A URL is never queued twice: it is rejected if it is in either set.
    """

    def __init__(self):
        # URLs already returned by has_newurls().
        self.oldurls = set()
        # URLs queued and waiting to be returned.
        self.newurls = set()

    def add_newurls(self, urls):
        """Queue every URL in *urls*; a falsy *urls* (None, empty) is ignored."""
        if urls:
            for i in urls:
                self.add_newurl(i)

    def add_newurl(self, url):
        """Queue *url* unless it is already pending or was already handed out."""
        if url not in self.newurls and url not in self.oldurls:
            self.newurls.add(url)

    def has_newurls(self):
        """Return the next pending URL and mark it as handed out.

        An arbitrary URL is removed from ``newurls`` (sets are unordered),
        added to ``oldurls`` and returned.  When nothing is pending, ``None``
        is returned instead of letting ``set.pop()`` raise ``KeyError``, so
        the result can also be used as a truth test in a crawl loop.
        """
        if not self.newurls:
            return None
        url = self.newurls.pop()
        self.oldurls.add(url)
        return url

class data_get(object):

def __init__(self):

self.man

确定要放弃本次机会？

福利倒计时

: :

立减 ¥

普通VIP年卡可用

关注关注