# 辽宁考公报名统计脚本
# 合并xls,统计岗位要求和报名人数
# 自用,仅供学习参考
import xlrd
import csv
import re
# Load every row of the first worksheet of the position table into i1
# (one list of cell values per row), then echo it followed by a blank line.
workbook = xlrd.open_workbook('1.2022年度丹东市考试录用公务员职位信息表.xls')
sheet = workbook.sheets()[0]
i1 = [
    sheet.row_values(row_index, start_colx=0, end_colx=None)
    for row_index in range(sheet.nrows)
]
print(i1)
print()
# Collect the <td> cell texts of every line of the registration export into
# i2: one list of cell strings per line that contains at least one cell.
# NOTE(review): the file is read as text and searched for <td> markup, so it
# is presumably an HTML table saved with an .xls extension -- confirm.
td_pattern = re.compile(r'<td>(.*?)</td>')
i2 = []
# NOTE(review): no encoding is passed, so the platform default is used --
# confirm it matches how the export was saved.
with open('职位统计.xls') as fp2:
    # Scan the raw lines directly. Routing them through csv.reader split each
    # line at its first comma (losing every later cell) and produced an empty
    # row for blank lines, which crashed on row[0].
    for line in fp2:
        cells = td_pattern.findall(line)
        if cells:
            i2.append(cells)
print(i2)
print()
def _strip_newlines(value):
    """Return *value* as text with embedded line feeds removed.

    Line breaks inside cell text could make otherwise equal cells compare
    unequal, so they are stripped before matching. Non-string cells (xlrd
    returns numeric cells as floats) are converted with str() so they simply
    fail to match instead of raising AttributeError.
    """
    return str(value).replace('\n', '')


# Index the scraped rows once by their first two cells; the third cell is the
# value appended to the output. setdefault keeps the first occurrence, which
# is the row the original linear search (with its break) would have picked.
applicants_by_key = {}
for cells in i2:
    if len(cells) < 3:
        # Lines with fewer than three <td> cells cannot supply a key and a
        # count; skip them instead of failing with IndexError.
        continue
    key = (_strip_newlines(cells[0]), _strip_newlines(cells[1]))
    applicants_by_key.setdefault(key, cells[2])

# Write the merged table: row 0 of i1 is copied unchanged, row 1 is treated as
# the column header and gains a '报名人数' column, and every later row gains
# the matching count or '未查到' when no scraped row matches.
with open('out.csv', 'w', newline='') as f:
    csv_write = csv.writer(f, dialect='excel')
    csv_write.writerow(i1[0])
    header = i1[1]
    header.append('报名人数')
    csv_write.writerow(header)
    for row in i1[2:]:
        # Columns 1 and 4 of the worksheet row are compared with cells 0 and 1
        # of the scraped row.
        key = (_strip_newlines(row[1]), _strip_newlines(row[4]))
        row.append(applicants_by_key.get(key, '未查到'))
        print(row)
        csv_write.writerow(row)