/**
 * Parses the resource at {@code weburl} and returns the HTML of every
 * {@code <div>} node that carries both the attribute {@code class="newsCon"}
 * and the attribute {@code id="IDNewsDtail"}.
 *
 * <p>The extracted HTML is also written to standard output, exactly as the
 * previous implementation did. Unlike the previous implementation, which
 * always returned an empty string, the extracted HTML is now returned.
 *
 * @param weburl the resource locator passed to the {@code Parser}
 *               constructor; must not be {@code null}
 * @return the result of {@code NodeList.toHtml()} for the matching nodes
 * @throws IllegalArgumentException if {@code weburl} is {@code null}
 * @throws Exception if the parser cannot be created or the extraction fails
 */
public String getContent(String weburl) throws Exception {
    if (weburl == null) {
        throw new IllegalArgumentException("weburl must not be null");
    }

    Parser parser = new Parser(weburl);
    // NOTE(review): this re-applies the encoding the parser already reports,
    // which looks like a no-op; kept in case the library relies on the call.
    parser.setEncoding(parser.getEncoding());

    // A node must satisfy all three predicates to be selected.
    NodeFilter filter = new AndFilter(new NodeFilter[] {
        new TagNameFilter("div"),
        new HasAttributeFilter("class", "newsCon"),
        new HasAttributeFilter("id", "IDNewsDtail") });

    NodeList nodelist = parser.extractAllNodesThatMatch(filter);
    String content = nodelist.toHtml();

    // Preserve the original console output.
    System.out.println(content);
    return content;
}
抓取的另一种思路
最新推荐文章于 2025-06-26 17:25:27 发布