12星座都是什么性格,大数据告诉你!
下面是利用Python爬取与12星座性格相关的微博后,生成的12星座性格特征词云!这里以白羊座为例,其他星座的结果放在最后。
上代码(以白羊座为例):
1. 微博数据爬取(需要安装selenium,以及Firefox的驱动geckodriver)
# coding=utf-8
import time
import datetime
import re
import os
import sys
import codecs
import shutil
import urllib
import random
from selenium import webdriver
from selenium.webdriver.common.keys import Keys
import selenium.webdriver.support.ui as ui
from selenium.webdriver.common.action_chains import ActionChains
import xlwt
# Start Firefox first: this creates the module-level WebDriver instance at
# import time. LoginWeibo below uses this shared `driver` for all page
# navigation and element lookups.
driver = webdriver.Firefox()
#第一步: 登录login.sina.com
def LoginWeibo(username, password):
try:
#输入用户名/密码登录
print(u'准备登陆Weibo.cn网站...')
driver.get("https://login.sina.com.cn/signup/signin.php")
elem_user = driver.find_element_by_name("username")
elem_user.send_keys(username) #用户名
elem_pwd = driver.find_element_by_name("password")
elem_pwd.send_keys(password) #密码
elem_sub = driver.find_element_by_xpath("/html/body/div[1]/div/div[2]/div[2]/form/div[2]/div/ul/li[7]/div[1]")
elem_sub.click() #点击登陆 因无name属性
try:
#输入验证码
time.sleep(10)
elem_sub.click()
except:
#不用输入验证码
pass
print('Crawl in ', driver.current_url)
print(u'输出Cookie键值对信息:')
'''for cookie in driver.get_cookies():
print(cookie)
for key in cookie:
print(key, cookie[key])'''
print(u'登陆成功...')
except Exception as e:
print(