# 正则匹配中文的固定写法:[\u4E00-\u9FA5](字符类,匹配单个汉字;写成 [\u4E00-\u9FA5]+ 可匹配连续的汉字)
# 用法:re.findall(r"正则表达式", "待处理的内容", re.DOTALL) —— 返回所有匹配结果组成的列表;re.DOTALL 使 "." 也能匹配换行符
import re
from lxml import etree
def demo():
content = """<?xml version="1.0" encoding="GB2312"?>
<tree>
<tree curCode="110000" text="北京局本部" attrsName="" attrs="" attrSplit="@#$" />
<tree curCode="120000" text="天津局本部" attrsName="" attrs="" attrSplit="@#$" />
<tree curCode="130000" text="河北局本部" attrsName="" attrs="" attrSplit="@#$" />
<tree curCode="140000" text="山西局本部" attrsName="" attrs="" attrSplit="@#$" />
<