一个基于 XmlPullParser 的 RSS 解析类(采用 Pull 流式解析,而非 DOM 解析)

public class RssParser {

        private int currentstate = -1;
        private boolean isItemTAG = false;

        private RssItem rssItem;
        private RssFeed rssFeed;

        final int TITLE = 1;
        final int LINK = 2;
        final int DESCRIPTION = 3;
        final int PUBDATE = 4;
        public void ParserRss(String url) throws Exception {

                XmlPullParserFactory xmlPullParserFactory = XmlPullParserFactory.newInstance();
                xmlPullParserFactory.setNamespaceAware(true);
                XmlPullParser xmlPullParser = xmlPullParserFactory.newPullParser();
                URL urlAddress = new URL(url);
                xmlPullParser.setInput(urlAddress.openStream(), "gbk");
                int eventType = xmlPullParser.getEventType();
                while (eventType != xmlPullParser.END_DOCUMENT) {
                        if (eventType == xmlPullParser.START_DOCUMENT) {
                                System.out.println("start Document...");
                                rssFeed = new RssFeed();
                        } else if (eventType == xmlPullParser.END_DOCUMENT) {
                                System.out.println("end Document...");
                        } else if (eventType == xmlPullParser.START_TAG) {
                                if (xmlPullParser.getName().equals("item")) {
                                        rssItem = new RssItem();
                                        isItemTAG = true;
                                }
                                if (xmlPullParser.getName().equals("title")) {
                                        currentstate = TITLE;
                                }
                                if (xmlPullParser.getName().equals("link")) {
                                        currentstate = LINK;
                                }
                                if (xmlPullParser.getName().equals("description")) {
                                        currentstate = DESCRIPTION;
                                }
                                if (xmlPullParser.getName().equals("pubDate")) {
                                        currentstate = PUBDATE;
                                }
                        } else if (eventType == xmlPullParser.END_TAG) {
                                if (xmlPullParser.getName().equals("item")) {
                                        rssFeed.addItem(rssItem);
                                }

                        } else if (eventType == xmlPullParser.TEXT) {
                                if (isItemTAG) {
                                        switch (currentstate) {
                                        case TITLE:
                                                rssItem.setTitle(clearSpecialChar(xmlPullParser.getText()));
                                                currentstate = -1;
                                                break;
                                        case LINK:
                                                rssItem.setLink(clearSpecialChar(xmlPullParser.getText()));
                                                currentstate = -1;
                                                break;
                                        case DESCRIPTION:
                                                rssItem.setDescription(clearSpecialChar(xmlPullParser.getText()));
                                                currentstate = -1;
                                                break;
                                        case PUBDATE:
                                                rssItem.setPubData(clearSpecialChar(xmlPullParser.getText()));
                                                currentstate = -1;
                                                break;
                                        default:
                                                break;
                                        }
                                }
                        }

                        eventType = xmlPullParser.next();
                }
        }
        
        public RssFeed getFeed(){
                return rssFeed;
        }
        
        private String clearSpecialChar(String s){
                Pattern pattern = Pattern.compile("\\s|\\r|\\n|\\t");
                Matcher matcher = pattern.matcher(s);
                return matcher.replaceAll("").trim();
        }
}

  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值