15、解决 14 中 CSV 文件用 Excel 打开乱码的问题(Python):open('zhihu.csv', 'w', newline='', encoding='utf-8-sig')

"""Scrape Zhihu articles by Zhang Jiawei and store them locally.

For every article the title, creation time, link and excerpt are collected
from the Zhihu v4 articles API (the data behind
https://www.zhihu.com/people/zhang-jia-wei/posts) and written to both
``zhihu.xlsx`` and ``zhihu.csv``.
"""
import csv
import time

# Paged articles endpoint; ``offset`` and ``limit`` are filled in per request.
API_URL = (
    'https://www.zhihu.com/api/v4/members/zhang-jia-wei/articles'
    '?include=data%5B*%5D.comment_count%2Csuggest_edit%2Cis_normal'
    '%2Cthumbnail_extra_info%2Cthumbnail%2Ccan_comment%2Ccomment_permission'
    '%2Cadmin_closed_comment%2Ccontent%2Cvoteup_count%2Ccreated%2Cupdated'
    '%2Cupvoted_followees%2Cvoting%2Creview_info%2Cis_labeled%2Clabel_info'
    '%3Bdata%5B*%5D.author.badge%5B%3F(type%3Dbest_answerer)%5D.topics'
    '&offset={offset}&limit={limit}&sort_by=created'
)

# NOTE(review): the cookie below is a captured browser session. It is kept
# verbatim so the script behaves as published, but it will expire and should
# not live in source control -- consider loading it from the environment.
HEADERS = {
    'accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3',
    'accept-language': 'zh-CN,zh;q=0.9',
    'cache-control': 'max-age=0',
    'cookie': '__DAYU_PP=iJb63REJnnjIMmBvzNMV65ab0a6aae4f; q_c1=d75d908a13c44b95bd75f27578ad2088|1521641428000|1521641428000; _zap=bec28151-809b-4936-971a-d18f5255add0; tgw_l7_route=f2979fdd289e2265b2f12e4f4a478330; _xsrf=wQDRNSLBlRv3aimMzhUNyqg1BpLUnWAr; d_c0="ABDmoGi2RQ-PTp5SSFyQvDgz_QEjeQfCFgk=|1555156366"; capsion_ticket="2|1:0|10:1555156366|14:capsion_ticket|44:MTBhN2FkYjYyNWEyNDFjYWJiYTk2N2E1YTA1NDE4OTk=|084e15694c6993269b3aab564e9ea5d7983782f4b37dbc4537e000aa7b081901"',
    'upgrade-insecure-requests': '1',
    'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/73.0.3683.103 Safari/537.36',
}

PAGE_SIZE = 20
# The original script requested offsets 0 and 20 only, i.e. at most 40
# articles. Keep that cap by default; pass ``max_items=None`` to lift it.
MAX_ARTICLES = 40
REQUEST_TIMEOUT = 10  # seconds; requests waits indefinitely without one
TIME_FORMAT = "%Y-%m-%d %H:%M:%S"
# Header row shared by the Excel sheet and the CSV file.
COLUMNS = ['编号', '标题', '创建时间', '链接', '摘要']


def page_offsets(total, page_size=PAGE_SIZE, max_items=MAX_ARTICLES):
    """Return the request offsets needed to cover the available articles.

    Args:
        total: Number of articles reported by the API (``paging.totals``).
        page_size: Number of articles returned per request.
        max_items: Upper bound on articles to fetch, or ``None`` for no cap.

    Returns:
        A list of offsets ``[0, page_size, ...]``; empty when ``total`` is 0.

    Raises:
        ValueError: If ``page_size`` is not positive.
    """
    if page_size <= 0:
        raise ValueError('page_size must be positive')
    wanted = total if max_items is None else min(total, max_items)
    return list(range(0, max(wanted, 0), page_size))


def format_created(timestamp):
    """Format a Unix timestamp as local time, ``YYYY-MM-DD HH:MM:SS``."""
    return time.strftime(TIME_FORMAT, time.localtime(timestamp))


def article_row(number, item):
    """Build one output row (matching ``COLUMNS``) from an API article dict.

    Args:
        number: 1-based running index of the article.
        item: Article dict with ``title``, ``created``, ``url``, ``excerpt``.

    Returns:
        ``[number, title, formatted creation time, url, excerpt]``.
    """
    return [
        number,
        item['title'],
        format_created(item['created']),
        item['url'],
        item['excerpt'],
    ]


def fetch_page(session, offset):
    """Fetch one page of articles and return the decoded JSON payload.

    Raises the session's HTTP error on a non-2xx response instead of failing
    later with an opaque ``KeyError`` on the missing ``data`` key.
    """
    response = session.get(
        API_URL.format(offset=offset, limit=PAGE_SIZE),
        headers=HEADERS,
        timeout=REQUEST_TIMEOUT,
    )
    response.raise_for_status()
    return response.json()


def main():
    """Download the articles and write them to ``zhihu.xlsx`` / ``zhihu.csv``."""
    # Third-party imports are deferred so the pure helpers above remain
    # importable (and testable) with only the standard library installed.
    import openpyxl
    import requests

    # Excel header
    workbook = openpyxl.Workbook()
    sheet = workbook.active
    sheet.title = '张佳玮的文章'
    sheet.append(COLUMNS)

    with requests.Session() as session:
        # The first page also carries the total count, so reuse it below
        # rather than requesting offset 0 twice.
        first_page = fetch_page(session, 0)
        totals = first_page['paging']['totals']

        # 'utf-8-sig' writes a BOM so Excel detects UTF-8 and shows the
        # Chinese text correctly; newline='' is required by the csv module.
        with open('zhihu.csv', 'w', newline='', encoding='utf-8-sig') as csv_file:
            writer = csv.writer(csv_file)
            writer.writerow(COLUMNS)

            number = 0
            for offset in page_offsets(totals):
                page = first_page if offset == 0 else fetch_page(session, offset)
                for item in page['data']:
                    number += 1
                    row = article_row(number, item)
                    # Progress output: index, creation time, title.
                    print(number, row[2], item['title'], sep='\t')
                    sheet.append(row)   # Excel content
                    writer.writerow(row)  # CSV content

    # Save the Excel workbook to disk
    workbook.save('zhihu.xlsx')


if __name__ == '__main__':
    main()

  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值