要爬取表单数据,需要模拟HTTP请求,并将表单数据作为请求参数发送到网站服务器。Java中有许多库可以用来发送HTTP请求,例如Apache HttpClient、OkHttp等。
以下是使用Apache HttpClient库发送带有表单数据的POST请求的示例代码:
import org.apache.http.HttpEntity;
import org.apache.http.HttpResponse;
import org.apache.http.NameValuePair;
import org.apache.http.client.HttpClient;
import org.apache.http.client.entity.UrlEncodedFormEntity;
import org.apache.http.client.methods.HttpPost;
import org.apache.http.impl.client.HttpClientBuilder;
import org.apache.http.message.BasicNameValuePair;
import org.apache.http.util.EntityUtils;
import java.io.IOException;
import java.util.ArrayList;
import java.util.List;
public class FormSubmitExample {
public static void main(String[] args) throws IOException {
HttpClient httpClient = HttpClientBuilder.create().build();
HttpPost httpPost = new HttpPost("http://example.com/submit-form");
// Add form data
List<NameValuePair> params = new ArrayList<>();
params.a