Python开发的著名作品——学了一个多月Python了，终于有能拿得出手的作品了

最新推荐文章于 2024-05-13 09:07:57 发布

weixin_39859055

最新推荐文章于 2024-05-13 09:07:57 发布

阅读量215

点赞数

# -*- coding: utf-8 -*-

import csv
import json
# url编码
from urllib.parse import quote
# url解码
from urllib.parse import unquote

import scrapy

from Taobao.items import TaobaoItem

class TaobaoSpider(scrapy.Spider):
    """Spider that queries the ai.taobao.com search endpoint for a keyword.

    The user is prompted for a page count and a search keyword.  For every
    result page the spider appends one CSV row per product (description,
    real price, shop nick) to ``<keyword>.csv`` and yields one
    ``TaobaoItem`` per product carrying its picture URL.
    """

    name = "taobao"

    # allowed_domains = ["taobao.com/"]

    # NOTE: both prompts are part of the class body, so they run as soon as
    # this class definition is executed.  They are kept here so that the
    # ``page`` and ``Quote`` class attributes stay available exactly as
    # before.  ``page`` is kept as the raw string the user typed.
    page = input("请输入打印页数:")

    Quote = input("请输入要搜索的商品名")

    # Single source of truth for the search URL; ``{page}`` is the 1-based
    # result page and ``{key}`` the percent-encoded search keyword.
    _SEARCH_URL = (
        "https://ai.taobao.com/search/getItem.htm?_tb_token_=e3d450b1e33e"
        "&__ajax__=1&pid=mm_33793785_3431230_471812702&unid=&clk1="
        "&page={page}&pageSize=60"
        "&pvid=200_11.224.194.119_358_1541678031255&squareFlag="
        "&sourceId=search&ppathName=&supportCod=&city=&ppath=&dc12="
        "&pageNav=false&itemAssurance=&fcatName=&price=&cat=&from=&tmall="
        "&key={key}&fcat=&ppage=0&debug=false&maxPageSize=200&sort="
        "&exchange7=&custAssurance=&postFree=&npx=50&location="
    )

    # Always start from the first page; the remaining pages are scheduled
    # from ``parse``.  ``safe=""`` percent-encodes every reserved character
    # (the previous second positional argument "utf-8" was being interpreted
    # as the ``safe`` set, not as the encoding; UTF-8 is already the default).
    start_urls = [_SEARCH_URL.format(page=1, key=quote(Quote, safe=""))]

    a = 1

    # Becomes True on the instance once the CSV header has been written, so
    # later pages append to the file instead of truncating it.
    _csv_started = False

    def parse(self, response):
        """Handle one page of search results.

        Writes the page's products to the CSV file, yields a ``TaobaoItem``
        with the ``origPicUrl`` field for each product and, when handling
        the first page, schedules requests for pages 2 up to the page count
        the user entered.

        Args:
            response: Scrapy response whose body is the JSON search payload.
                Follow-up requests carry their page number in
                ``response.meta["page"]``; the start request has no such key
                and is treated as page 1.

        Yields:
            ``TaobaoItem`` objects, followed by ``scrapy.Request`` objects
            for the remaining pages.

        Raises:
            ValueError: if the page count typed by the user is not an integer.
        """
        current_page = response.meta.get("page", 1)
        total_pages = int(self.page)

        # Tolerate a payload without results instead of raising KeyError.
        result = json.loads(response.body).get("result") or {}
        auctions = result.get("auction") or []
        if not auctions:
            self.logger.warning(
                "no auction entries in response for page %s", current_page
            )

        # Write the whole page in one go so the file is never left open
        # while the generator is suspended at a ``yield``.
        self._write_rows(
            [
                (entry["description"], entry["realPrice"], entry["nick"])
                for entry in auctions
            ]
        )

        for entry in auctions:
            item = TaobaoItem()
            # The payload's picture URL has no scheme, so one is prepended.
            item["origPicUrl"] = "https:" + entry["origPicUrl"]
            yield item

        print("=" * 40 + "第" + str(current_page) + "页下载完毕" + "=" * 40)

        # Only the first page fans out, so each remaining page is requested
        # exactly once and with the keyword the user actually entered.
        if current_page == 1:
            keyword = quote(self.Quote, safe="")
            for n in range(2, total_pages + 1):
                yield scrapy.Request(
                    self._SEARCH_URL.format(page=n, key=keyword),
                    self.parse,
                    meta={"page": n},
                )

    def _write_rows(self, rows):
        """Append ``rows`` to ``<keyword>.csv``, creating it on first use.

        The first call truncates any existing file and writes the header
        row; later calls append.  The ``csv`` module handles quoting, so
        commas or quotes inside a product description do not break columns.

        Args:
            rows: iterable of ``(description, real_price, shop_nick)`` tuples.
        """
        mode = "a" if self._csv_started else "w"
        with open(
            "{}.csv".format(self.Quote), mode, encoding="utf-8", newline=""
        ) as csv_file:
            writer = csv.writer(csv_file)
            if not self._csv_started:
                writer.writerow(["商品名", "价格", "店名"])
            writer.writerows(rows)
        self._csv_started = True