爬取12306站点信息


# -*- coding: utf-8 -*-

import ssl
import urllib2
from prettytable import PrettyTable

def get_station_name():
    url = "https://kyfw.12306.cn/otn/resources/js/framework/station_name.js?station_version=1.9025"
    
    #目的为了通过未认证的12306证书
    ssl._create_default_https_context = ssl._create_unverified_context

    req = urllib2.Request(url)
    req.add_header("Referer","https://kyfw.12306.cn/otn/leftTicket/init")
    req.add_header("User-Agent", "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/60.0.3112.113 Safari/537.36")
    names = urllib2.urlopen(req).read()    
    
    with open("station_name0.txt", 'wb') as f:
        f.write(names) 
    
    itemsTmp = names.split("'")
    if len(itemsTmp) == 3:
        items = itemsTmp[1].split("@")
        
        table = PrettyTable(["序号","中文名","车站代码","中文拼音","拼音首字母"])
        table.header = True 
        table.padding_width = 2
           
        for item in items:
            if item == "":
                continue
                
            info = item.split("|")
            tr = [info[5],info[1],info[2],info[3],info[4]]
            table.add_row(tr)
                
        with open("station_name.txt", 'wb') as f:
            f.write(table.get_string()) 
            
if __name__ == "__main__":
    import sys
    reload(sys)
    sys.setdefaultencoding('utf-8')
    get_station_name()
 






  • 1
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值