一个基于 XmlPullParser(Pull 方式,而非 DOM)的 RSS 解析类

/**
 * Pull-based RSS reader.
 *
 * <p>{@link #ParserRss(String)} downloads the document at a URL, walks it with an
 * {@code XmlPullParser} and, for every {@code <item>} element, copies the text of its
 * {@code <title>}, {@code <link>}, {@code <description>} and {@code <pubDate>} children into
 * an {@link RssItem}. Completed items are appended to an {@link RssFeed} that can be fetched
 * with {@link #getFeed()}.
 *
 * <p>Parsing state lives in unsynchronized instance fields, so an instance must not be used
 * by several threads while a parse is running.
 */
public class RssParser {

    /** State value meaning "the next text node is not a field we collect". */
    private static final int NONE = -1;

    static final int TITLE = 1;
    static final int LINK = 2;
    static final int DESCRIPTION = 3;
    static final int PUBDATE = 4;

    /** Encoding used by {@link #ParserRss(String)}; kept from the original implementation. */
    private static final String DEFAULT_ENCODING = "gbk";

    /** Compiled once; {@code \s} already covers {@code \r}, {@code \n} and {@code \t}. */
    private static final Pattern WHITESPACE = Pattern.compile("\\s");

    /** Which item field the next TEXT event belongs to, or {@link #NONE}. */
    private int currentstate = NONE;

    /** True only between an {@code <item>} start tag and its matching end tag. */
    private boolean isItemTAG = false;

    /** Item currently being filled; {@code null} outside of an {@code <item>}. */
    private RssItem rssItem;

    /** Result of the most recent parse; {@code null} until a parse has started. */
    private RssFeed rssFeed;

    /**
     * Downloads and parses the feed at {@code url}, decoding it as "gbk".
     *
     * @param url address of the RSS document
     * @throws Exception if the URL is malformed, the download fails or the XML cannot be parsed
     */
    public void ParserRss(String url) throws Exception {
        ParserRss(url, DEFAULT_ENCODING);
    }

    /**
     * Downloads and parses the feed at {@code url} using the given input encoding.
     *
     * @param url      address of the RSS document
     * @param encoding charset name handed unchanged to {@code XmlPullParser.setInput}; per the
     *                 XmlPullParser API documentation {@code null} asks the parser to detect
     *                 the encoding itself
     * @throws Exception if the URL is malformed, the download fails or the XML cannot be parsed
     */
    public void ParserRss(String url, String encoding) throws Exception {
        XmlPullParserFactory factory = XmlPullParserFactory.newInstance();
        factory.setNamespaceAware(true);
        XmlPullParser parser = factory.newPullParser();

        // Start from a clean state so a failed earlier parse cannot influence this one.
        currentstate = NONE;
        isItemTAG = false;
        rssItem = null;

        // try-with-resources closes the network stream even when parsing throws.
        try (java.io.InputStream in = new URL(url).openStream()) {
            parser.setInput(in, encoding);

            int eventType = parser.getEventType();
            while (eventType != XmlPullParser.END_DOCUMENT) {
                if (eventType == XmlPullParser.START_DOCUMENT) {
                    System.out.println("start Document...");
                    rssFeed = new RssFeed();
                } else if (eventType == XmlPullParser.START_TAG) {
                    onStartTag(parser.getName());
                } else if (eventType == XmlPullParser.END_TAG) {
                    onEndTag(parser.getName());
                } else if (eventType == XmlPullParser.TEXT) {
                    onText(parser.getText());
                }
                eventType = parser.next();
            }
            // The loop exits on END_DOCUMENT, so the message has to be printed here; inside
            // the loop that branch could never be reached.
            System.out.println("end Document...");
        }
    }

    /**
     * Returns the feed built by the most recent parse.
     *
     * @return the feed, or {@code null} if no parse has been started yet
     */
    public RssFeed getFeed() {
        return rssFeed;
    }

    /** Opens a new item on {@code <item>}; otherwise records which field the tag denotes. */
    private void onStartTag(String name) {
        if ("item".equals(name)) {
            rssItem = new RssItem();
            isItemTAG = true;
            // Drop any state left over from channel-level tags seen before this item.
            currentstate = NONE;
        } else {
            currentstate = fieldFor(name);
        }
    }

    /** Stores a finished item on {@code </item>} and clears the pending field state. */
    private void onEndTag(String name) {
        if ("item".equals(name) && isItemTAG) {
            rssFeed.addItem(rssItem);
            rssItem = null;
            // Text that follows the item must not be written into it.
            isItemTAG = false;
        }
        // An element without text (e.g. <title/>) must not hand its state to later text.
        currentstate = NONE;
    }

    /** Writes a text node into the current item when it belongs to a collected field. */
    private void onText(String text) {
        if (!isItemTAG || currentstate == NONE) {
            return;
        }
        String value = clearSpecialChar(text);
        switch (currentstate) {
            case TITLE:
                rssItem.setTitle(value);
                break;
            case LINK:
                rssItem.setLink(value);
                break;
            case DESCRIPTION:
                rssItem.setDescription(value);
                break;
            case PUBDATE:
                rssItem.setPubData(value);
                break;
            default:
                break;
        }
        currentstate = NONE;
    }

    /** Maps an element name to its field constant, or {@link #NONE} for other elements. */
    private static int fieldFor(String name) {
        if ("title".equals(name)) {
            return TITLE;
        }
        if ("link".equals(name)) {
            return LINK;
        }
        if ("description".equals(name)) {
            return DESCRIPTION;
        }
        if ("pubDate".equals(name)) {
            return PUBDATE;
        }
        return NONE;
    }

    /**
     * Removes every whitespace character from {@code s} and trims the result.
     *
     * <p>NOTE(review): this also deletes the spaces between words (and inside dates); the
     * behavior is kept as-is because callers may rely on it — confirm whether that is wanted.
     */
    private String clearSpecialChar(String s) {
        return WHITESPACE.matcher(s).replaceAll("").trim();
    }
}
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值