一、通过HtmlPage获取标题
例如:
// Sample input: a minimal HTML document with a title and a body.
String html = "<HTML><HEAD><TITLE>AAA</TITLE></HEAD><BODY>我是中国人!</BODY></HTML>";

// Build a parser over the in-memory markup, using the GBK charset.
Parser htmlParser = Parser.createParser(html, "GBK");

// The HtmlPage is handed to visitAllNodesWith so it is driven over the parsed nodes.
HtmlPage pageVisitor = new HtmlPage(htmlParser);
htmlParser.visitAllNodesWith(pageVisitor);

// str is the page title; per the original note, the content between the
// body tags can also be obtained at this point.
String str = pageVisitor.getTitle();
二、通过TitleTag获取标题
// Find the title tags of a document with an ObjectFindingVisitor and print each title.
// `resourse` is defined outside this snippet and is passed to the Parser constructor
// unchanged (presumably a URL or file path - confirm against the surrounding code).
ObjectFindingVisitor visitor = new ObjectFindingVisitor(TitleTag.class);
Parser p = new Parser(resourse);
p.setEncoding("gb2312");
p.visitAllNodesWith(visitor);
Node[] nodes = visitor.getTags(); // nodes collected by the visitor
System.out.println(nodes.length); // number of collected nodes
for (int i = 0; i < nodes.length; i++) {
    // The visitor was created for TitleTag.class, so each node is cast to TitleTag.
    TitleTag titleTag = (TitleTag) nodes[i];
    System.out.println("Tittle = " + titleTag.getTitle()); // print the title
}
例如:
// Sample input: a minimal HTML document with a title and a body.
String html = "<HTML><HEAD><TITLE>AAA</TITLE></HEAD><BODY>我是中国人!</BODY></HTML>";

// Build a parser over the in-memory markup, using the GBK charset.
Parser htmlParser = Parser.createParser(html, "GBK");

// The HtmlPage is handed to visitAllNodesWith so it is driven over the parsed nodes.
HtmlPage pageVisitor = new HtmlPage(htmlParser);
htmlParser.visitAllNodesWith(pageVisitor);

// str is the page title; per the original note, the content between the
// body tags can also be obtained at this point.
String str = pageVisitor.getTitle();
二、通过TitleTag获取标题
// Find the title tags of a document with an ObjectFindingVisitor and print each title.
// `resourse` is defined outside this snippet and is passed to the Parser constructor
// unchanged (presumably a URL or file path - confirm against the surrounding code).
ObjectFindingVisitor visitor = new ObjectFindingVisitor(TitleTag.class);
Parser p = new Parser(resourse);
p.setEncoding("gb2312");
p.visitAllNodesWith(visitor);
Node[] nodes = visitor.getTags(); // nodes collected by the visitor
System.out.println(nodes.length); // number of collected nodes
for (int i = 0; i < nodes.length; i++) {
    // The visitor was created for TitleTag.class, so each node is cast to TitleTag.
    TitleTag titleTag = (TitleTag) nodes[i];
    System.out.println("Tittle = " + titleTag.getTitle()); // print the title
}