帮别人写爬虫,先是单线程,太慢,改了多线程
1.单线程
import urllib
import urllib.request
import requests
import xlwt
import re
import string
def set_style(name, height, bold=False):
    """Build an xlwt cell style whose font has the given face, height and weight.

    Args:
        name: Font face name assigned to ``Font.name`` (e.g. 'Times New Roman').
        height: Value assigned unchanged to ``Font.height``.
            NOTE(review): xlwt presumably expects 1/20-point units - confirm.
        bold: Whether the font is bold. Defaults to False.

    Returns:
        A new ``xlwt.XFStyle`` whose ``font`` is the configured ``xlwt.Font``.
    """
    # Configure the font first, then attach it to a fresh style object.
    typeface = xlwt.Font()
    typeface.name = name
    typeface.bold = bold
    typeface.height = height
    typeface.color_index = 4  # colour is fixed at palette index 4 for every style

    cell_style = xlwt.XFStyle()
    cell_style.font = typeface
    return cell_style
# Workbook with a single worksheet; cells may be overwritten after first write.
wdk = xlwt.Workbook()
sheet1 = wdk.add_sheet('sheet1', cell_overwrite_ok=True)  # 'sheet1' is the worksheet name
row = ['招聘职位', '月薪', '学历要求', '工作经验', '应聘要求', '工作单位']

# Write the column titles across row 0, one title per column.
r = 0
for index, i in enumerate(row):
    sheet1.write(r, index, i)
index = len(row)  # same final value the hand-incremented column counter ended with
# NOTE(review): the pasted source lost its indentation; `r += 1` is assumed to
# run once after the header loop (moving past the title row) - confirm.
r += 1

import datetime
# Timestamp taken after the header row is written.
# NOTE(review): presumably used later to time the crawl - confirm.
starttime = datetime.datetime.now()
for pn in range(0,200,20):
url = 'http://zhaopin.baidu.com/quanzhi?tid=4139&ie=utf8&oe=utf8&query=%E6%95%