Python爬虫：爬取JSON响应内容（第六感别墅度假别墅列表）学习笔记

本文链接：https://blog.csdn.net/u010035907/article/details/52895414

# -*- coding: utf-8 -*-
"""
Created on Sat Oct 22 21:01:23 2016

@author: hhxsym
"""

import requests
import json
import os

# Working directory for this script; the path contains non-ASCII characters.
inpath = "C:\\Users\\hhxsym\\Desktop\\课程群Python爬虫"
# On Python 2 a plain string literal is a byte string and has to be decoded
# before os.chdir can open the non-ASCII path. On Python 3 the literal is
# already text and the ``unicode`` builtin no longer exists, so the decode
# step is skipped there instead of raising NameError.
if isinstance(inpath, bytes):
    inpath = inpath.decode("utf8")
os.chdir(inpath)

def _strip_jsonp_padding(text):
    """Return the JSON payload contained in a JSONP response body.

    A JSONP body looks like ``callback({...})``, optionally followed by
    ``;`` or whitespace. Everything between the first ``(`` and the last
    ``)`` is returned. A body that already starts with ``{`` or ``[`` is
    treated as plain JSON and returned unchanged (after stripping
    surrounding whitespace).

    Raises:
        ValueError: if no parenthesised payload can be found.
    """
    stripped = text.strip()
    if stripped[:1] in ('{', '['):
        return stripped
    start = stripped.find('(')
    end = stripped.rfind(')')
    if start == -1 or end < start:
        raise ValueError('response is not JSONP: %r' % stripped[:50])
    return stripped[start + 1:end]


def get_page_list(page=1):
    """Fetch one page of the villa listing and print each title with its URL.

    Prints, in order: the HTTP status code, the types of the raw response
    text and of the decoded object, the decoded JSON (non-ASCII characters
    left unescaped), and then one ``title url`` line per listing entry.

    Args:
        page: page number sent as the ``page`` query parameter.

    Raises:
        requests.RequestException: on connection failure, timeout, or a
            4xx/5xx HTTP status.
        ValueError: if the response body is not JSONP / valid JSON.
        KeyError: if the decoded data lacks the ``val`` / ``data`` /
            ``title`` / ``url`` keys read below.
    """
    url = 'http://www.senseluxury.com/destinations_list/77'
    payload = {'page': page, 'callback': 'jsonp'}
    # An explicit timeout keeps the script from hanging forever on a dead
    # connection; requests does not apply one by default.
    responses = requests.get(url, params=payload, timeout=10)
    print(responses.status_code)
    # Fail with a clear HTTP error instead of an opaque JSON decode error.
    responses.raise_for_status()

    # The server wraps the JSON in ``jsonp(...)``; unwrap it before decoding.
    wb_data = json.loads(_strip_jsonp_padding(responses.text))
    # Show the difference between the raw text and the decoded object.
    print("%s %s" % (type(responses.text), type(wb_data)))
    # ensure_ascii=False prints Chinese text readably instead of as \uXXXX.
    print(json.dumps(wb_data, ensure_ascii=False))

    # Each entry carries a site-relative URL; prefix the host to make it
    # absolute.
    for item in wb_data['val']['data']:
        title = item['title']
        villa_url = 'http://www.senseluxury.com' + item['url']
        print("%s %s" % (title, villa_url))




# Run the crawler for the first page when executed as a script.
if __name__ == '__main__':
    get_page_list(1)


# 网页json类型的查看：浏览器 -> 右键检查 -> network -> XHR ->页面触发(跳转页面) -> name勾选-> Response ->查看是否出现json格式字符串
# http://jsoneditoronline.org/ 在线格式化网站，查看 JSON 嵌套格式