1、首先添加依赖(maven)
<dependency>
<groupId>org.jsoup</groupId>
<artifactId>jsoup</artifactId>
<version>1.8.3</version>
</dependency>
2、记得修改package
3、代码中发送请求的方法位于 HttpRequestUtils 类中(代码未 import 该类,需与 CaijiUtils 放在同一个包下)
package com.demo.utils;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;
/**
 * Small demo scraper: reads the link list from a site's index page and prints each
 * entry's title, raw link and the text of the linked detail page.
 */
public class CaijiUtils {

    /**
     * Fetches the index page, then follows every matched link and prints its content.
     *
     * @param args unused
     */
    public static void main(String[] args) {
        String siteUrl = "http://dt.sxgov.cn/";
        String siteRule = ".text1>ul>li>a";
        String detailRule = "#ltext";

        Elements links = responseData(siteUrl, siteRule);
        for (Element link : links) {
            System.out.println("新闻标题:" + link.text());
            System.out.println("连接地址:" + link.attr("href"));

            // Resolve the href against the page's base URI rather than concatenating
            // strings: concatenation produces a broken URL when the href is already
            // absolute or starts with "/".
            String detailUrl = link.absUrl("href");

            // absUrl yields "" when the link cannot be resolved; skip the request then.
            Elements detailPage = detailUrl.isEmpty()
                    ? new Elements()
                    : responseData(detailUrl, detailRule);

            // The detail page may not contain the expected node; print empty content
            // instead of failing with IndexOutOfBoundsException on get(0).
            String content = detailPage.isEmpty() ? "" : detailPage.get(0).text();
            System.out.println("新闻内容:" + content);
        }
    }

    /**
     * Downloads a page and returns the elements matching a CSS selector.
     *
     * <p>The document is parsed with {@code url} as its base URI so that callers can
     * resolve relative links via {@code absUrl}.
     *
     * @param url  address of the page to fetch
     * @param rule jsoup CSS selector applied to the parsed page
     * @return the matching elements; empty when nothing matches or no HTML was obtained
     */
    public static Elements responseData(String url, String rule) {
        String htmlInfo = HttpRequestUtils.sendGetRequest(url);
        // NOTE(review): sendGetRequest is defined elsewhere; presumably it may return
        // null on failure — guard so parsing does not blow up. Confirm against helper.
        if (htmlInfo == null) {
            return new Elements();
        }
        Document doc = Jsoup.parse(htmlInfo, url);
        return doc.select(rule);
    }
}