csv写入

最新推荐文章于 2024-09-30 14:16:32 发布

yhl19871003

最新推荐文章于 2024-09-30 14:16:32 发布

阅读量67

点赞数

文章标签： python

本文链接：https://blog.csdn.net/yhl19871003/article/details/120792186

版权

import csv
import os

from lxml import etree
import  requests

# HTTP headers passed to requests.get() by get(); only a browser-style
# User-Agent (Chrome 86 on Windows 10) is set.
header = {
    "User-Agent": (
        "Mozilla/5.0 (Windows NT 10.0; WOW64) "
        "AppleWebKit/537.36 (KHTML, like Gecko) "
        "Chrome/86.0.4240.198 Safari/537.36"
    ),
}

# Module-level accumulator: get() appends one row per scraped book to it
# and returns this same list object.
list1 = list()
def get(url):
    """Scrape one listing page and append a row per book to ``list1``.

    The page at *url* is downloaded with the module-level ``header`` dict
    and parsed with lxml.  Five XPath queries produce parallel lists
    (titles, authors, evaluation texts, detail links, cover image URLs)
    which are zipped together; for every complete tuple a row
    ``[title, author, evaluate, link]`` is appended to the module-level
    ``list1``.  Newlines and spaces are removed from the evaluation text
    before it is stored.

    Args:
        url: Address of the page to fetch.

    Returns:
        The shared module-level ``list1`` (not a fresh list), so rows
        collected by earlier calls are included as well.

    Raises:
        requests.RequestException: If the request fails, times out, or the
            server answers with an HTTP error status.
    """
    # A timeout keeps the script from hanging forever on a stalled
    # connection; raise_for_status() surfaces 4xx/5xx answers instead of
    # silently parsing an error page into zero rows.
    res = requests.get(url, headers=header, timeout=10)
    res.raise_for_status()

    html = etree.HTML(res.content)
    if html is None:
        # lxml returns None for an empty document; nothing to extract.
        return list1

    titles = html.xpath('//div[@class="pl2"]/a/@title')
    authors = html.xpath('//p[@class="pl"]/text()')
    evaluates = html.xpath('//span[@class="pl"]/text()')
    links = html.xpath('//a[@class="nbg"]/@href')
    jpgs = html.xpath('//a[@class="nbg"]/img/@src')

    # The cover URL is not stored in the row, but it stays in the zip so
    # that the number of rows is still bounded by the shortest of the five
    # lists, exactly as before.
    for title, author, evaluate, link, _jpg in zip(
            titles, authors, evaluates, links, jpgs):
        row = [
            title,
            author,
            evaluate.replace('\n', '').replace(" ", ''),
            link,
        ]
        list1.append(row)
        print(str(row) + "开始写入")

    return list1


# Driver: scrape the listing page(s) and dump every collected row to
# douban.csv in the current working directory.
#
# NOTE(review): range(0, 25, 25) yields only start=0, i.e. a single page.
# The URL pages in steps of 25; raise the stop value if more pages are
# wanted -- left unchanged here on purpose.
a = []
for n in range(0, 25, 25):
    url = "https://book.douban.com/top250?start=" + str(n)

    # get() returns its cumulative module-level list, so after the last
    # iteration ``a`` already holds the rows of every page fetched.
    a = get(url)
    print(a)

# Write once after scraping instead of truncating and rewriting the file
# on every iteration.  The encoding is explicit so the output does not
# depend on the platform locale (the rows contain Chinese text); the
# "utf-8-sig" BOM lets spreadsheet tools detect UTF-8.
with open("douban.csv", 'w', newline="", encoding="utf-8-sig") as f:
    csv.writer(f).writerows(a)



# import csv,os
# csccows=[]
# for con in os.listdir("."):
#     if con.endswith(".csv"):
#         print(con)
#         with open(".\\"+con) as f:
#             file=csv.reader(f)
#             print(type(file))
#             for cow in file:
#                 if file.line_num == 1:
#                     continue
#                 csccows.append(cow)
#             f.close()
#             print(csccows)
#             csccows.reverse()
#             with open(".\\"+con,'w',newline="") as f:
#                 file1=csv.writer(f)
#                 for cow in csccows:
#
#                         print("准备写入 "+str(cow))
#                         file1.writerow(cow)