# 这段代码来自在优酷看的一段解析美团网 XML 的视频;视频清晰度不高,但是讲得条理很清晰,特别喜欢,感谢原作者!
#用python解析xml
#xml可扩展标记语言
# tag. tag.attribute 属性 tag.text
#china ,14;us 12.1
# <population>
# <country>
# china
# </country>
#</population>
# 树状结构 tree
# deals
# data data data data
# deal shops
#遍历一棵树
import xml.etree.ElementTree as ET
#写一个类
class MeituanParser:
    """Collect deal records from a Meituan XML feed.

    The feed is expected to contain ``<data>`` elements, each holding a
    ``<deal>`` child with ``deal_id``, ``salse_num`` and ``deal_price``
    children.  Parsed records accumulate in ``meituan_deal_set`` across
    calls to :meth:`parser`.
    """

    # (tag, converter) for every field copied out of a <deal> element.
    # A converter of None stores the element text unchanged.
    # NOTE(review): 'salse_num' looks like a misspelling of 'sales_num';
    # confirm against the real feed before renaming the tag/key.
    _FIELDS = (
        ('deal_id', None),
        ('salse_num', int),
        ('deal_price', float),
    )

    def __init__(self):
        # List of dicts, one per <deal> element seen so far.
        self.meituan_deal_set = []

    def parser(self, filepath):
        """Parse ``filepath`` and append one dict per ``<deal>`` found.

        Args:
            filepath: File name or file object accepted by
                ``xml.etree.ElementTree.parse``.

        Returns:
            ``self.meituan_deal_set``: the accumulated list of dicts.  A
            dict may contain the keys ``"deal_id"`` (str), ``"salse_num"``
            (int) and ``"deal_price"`` (float); a field that is missing or
            cannot be converted is reported on stdout and left out.

        Raises:
            Whatever ``ElementTree.parse`` raises for an unreadable or
            malformed file; those errors are not swallowed here.
        """
        # Load the XML file and walk every <data> element below the root.
        root = ET.parse(filepath).getroot()
        for data in root.iter('data'):
            deal = data.find('deal')
            if deal is None:
                # Nothing to record for a <data> element without a <deal>.
                continue

            meituan_dic = {}
            for tag, convert in self._FIELDS:
                try:
                    text = deal.find(tag).text
                    meituan_dic[tag] = text if convert is None else convert(text)
                except (AttributeError, TypeError, ValueError):
                    # AttributeError: the element is absent (find() gave None).
                    # TypeError / ValueError: empty or non-numeric text.
                    print('no %s' % tag)
            self.meituan_deal_set.append(meituan_dic)
        return self.meituan_deal_set
if __name__ == '__main__':
    # Script entry point: parse the sample feed file in the working directory.
    # The instance must be bound to the same name it is used under; the
    # original bound it to ``praser`` and then called ``parser.parser``.
    parser = MeituanParser()
    deals = parser.parser('meituan.txt')