1.Text和Keyword类型的区别
text: 写入文档时会对该字段的内容进行分词(拆词),并把分出的词条放入倒排索引表中
keyword: 不会进行分词,而是把整个字段值作为一个词条放入倒排索引表中
使用match匹配查询---会先对查询关键字进行分词,再用分出的词条到倒排索引表中进行匹配。
使用term精准匹配---不会对查询关键字进行分词,而是把关键字作为一个整体到倒排索引表中进行匹配。
2.springboot整合ES
(1)创建一个Springboot工程并加入相关的依赖
<dependencies>
<dependency>
<groupId>com.alibaba</groupId>
<artifactId>fastjson</artifactId>
<version>1.2.75</version>
</dependency>
<dependency>
<groupId>org.springframework.boot</groupId>
<artifactId>spring-boot-starter-data-elasticsearch</artifactId>
</dependency>
<dependency>
<groupId>org.springframework.boot</groupId>
<artifactId>spring-boot-starter-web</artifactId>
</dependency>
<dependency>
<groupId>org.projectlombok</groupId>
<artifactId>lombok</artifactId>
<optional>true</optional>
</dependency>
<dependency>
<groupId>org.springframework.boot</groupId>
<artifactId>spring-boot-starter-test</artifactId>
<scope>test</scope>
</dependency>
</dependencies>
(2) 创建一个配置,获取ES工具类对象。
/**
 * Spring configuration that exposes the Elasticsearch high-level REST client as a bean.
 */
@Configuration
public class ESConfig {

    /**
     * Builds the client object used to run operations against Elasticsearch.
     *
     * @return a client pointed at http://127.0.0.1:9200
     */
    @Bean
    public RestHighLevelClient restHighLevelClient() {
        HttpHost node = new HttpHost("127.0.0.1", 9200, "http");
        return new RestHighLevelClient(RestClient.builder(node));
    }
}
(3)对ES进行相关操作
3.1 操作索引---创建索引
/**
 * Creates the "qy151-index" index and prints the acknowledged flag of the response.
 * REST equivalent: PUT /{index name}
 */
@Test
void testCreateIndex() throws Exception {
    // The request object carries all the information describing the index to create.
    CreateIndexRequest request = new CreateIndexRequest("qy151-index");
    CreateIndexResponse response = client.indices().create(request, RequestOptions.DEFAULT);
    boolean acknowledged = response.isAcknowledged();
    System.out.println(acknowledged);
}
3.2 操作索引--删除索引
/**
 * Deletes the "qy151-index" index and prints the acknowledged flag of the response.
 */
@Test
public void testDeleteIndex() throws Exception {
    DeleteIndexRequest request = new DeleteIndexRequest("qy151-index");
    AcknowledgedResponse response = client.indices().delete(request, RequestOptions.DEFAULT);
    boolean acknowledged = response.isAcknowledged();
    System.out.println(acknowledged);
}
3.3 操作索引--判断索引是否存在
/**
 * Prints whether the "qy151-index" index exists.
 */
@Test
public void testIndexExists() throws Exception {
    GetIndexRequest request = new GetIndexRequest("qy151-index");
    System.out.println(client.indices().exists(request, RequestOptions.DEFAULT));
}
(4)操作文档---添加文档
/**
 * Indexes a User as document "1" of "qy151-index" and prints the result of the operation.
 * REST equivalent: PUT /{index}/1 {name:"",age:"",address:""}
 */
@Test
public void testInsertDoc() throws Exception {
    // source(String, XContentType): the document body as a JSON string, plus the format it is in.
    String json = JSON.toJSONString(new User("张三", "北京", 22));
    IndexRequest request = new IndexRequest("qy151-index")
            .id("1") // explicit document id
            .source(json, XContentType.JSON);
    IndexResponse response = client.index(request, RequestOptions.DEFAULT);
    System.out.println(response.getResult());
}
(5)查询文档--根据id查询
/**
 * Fetches document "1" from "qy151-index" and prints it, both mapped to a User and
 * as a single field read from the source map.
 * REST equivalent: GET /{index}/_doc/1
 *
 * @throws Exception if the request to Elasticsearch fails
 */
@Test
public void testGetDoc() throws Exception {
    GetRequest getRequest = new GetRequest("qy151-index");
    getRequest.id("1");
    GetResponse getResponse = client.get(getRequest, RequestOptions.DEFAULT);

    // A missing document comes back without a source; reading a field from the
    // source map without this check would throw a NullPointerException.
    if (!getResponse.isExists()) {
        System.out.println("document not found: " + getResponse.getId());
        return;
    }

    // Option 1: map the JSON source onto the entity class.
    User user = JSON.parseObject(getResponse.getSourceAsString(), User.class);
    System.out.println(user);

    // Option 2: read individual fields from the source as a map.
    Map<String, Object> source = getResponse.getSourceAsMap();
    System.out.println(source.get("address"));
}
(6)判断文档是否存在
/**
 * Prints whether document "2" exists in "qy151-index".
 */
@Test
public void testDocExist() throws Exception {
    GetRequest request = new GetRequest("qy151-index");
    request.id("2");
    System.out.println(client.exists(request, RequestOptions.DEFAULT));
}
(7)删除文档
/**
 * Document operation: deletes document "1" from "qy151-index" and prints the result.
 */
@Test
public void testDeleteDoc() throws Exception {
    DeleteRequest request = new DeleteRequest("qy151-index").id("1");
    DeleteResponse response = client.delete(request, RequestOptions.DEFAULT);
    System.out.println(response.getResult());
}
(8)修改文档
/**
 * Updates document "1" of "qy151-index" with a partial document built from a User
 * that only has its name set, then prints the result of the operation.
 */
@Test
public void testUpdateDoc() throws Exception {
    User changes = new User();
    changes.setName("刘德华");
    // NOTE(review): whatever fields the serializer emits for the otherwise empty User
    // are sent as part of the partial document - confirm unset fields are omitted.
    String partialJson = JSON.toJSONString(changes);

    UpdateRequest request = new UpdateRequest("qy151-index", "1")
            .doc(partialJson, XContentType.JSON);
    UpdateResponse response = client.update(request, RequestOptions.DEFAULT);
    System.out.println(response.getResult());
}
(9)批量添加文档
/**
 * Adds five User documents to "qy151-index" in a single bulk request and prints
 * whether the bulk response reports any failures.
 */
@Test
public void testBuck() throws Exception {
    List<User> users = new ArrayList<>();
    users.add(new User("2", "张三", "北京", 22));
    users.add(new User("3", "张三他爸", "上海", 22));
    users.add(new User("4", "李四", "杭州", 22));
    users.add(new User("5", "李四他妈", "广州", 22));
    users.add(new User("6", "王五", "南京", 22));

    BulkRequest bulkRequest = new BulkRequest("qy151-index");
    // One index operation per user, using the user's id as the document id. The
    // individual requests name no index; only the bulk request is given one.
    users.forEach(user -> bulkRequest.add(
            new IndexRequest()
                    .id(user.getId())
                    .source(JSON.toJSONString(user), XContentType.JSON)));

    BulkResponse response = client.bulk(bulkRequest, RequestOptions.DEFAULT);
    System.out.println(response.hasFailures());
}
(10)复杂查询
// Search query: GET /{index}/_search
// {
//   "query": {
//     "": {}
//   },
//   "from":
//   "size":
//   "_source": ["", ""],
//   "sort": {}
// }
// Steps:
// 1. Create the search request object (SearchRequest).
// 2. Build the conditions object (SearchSourceBuilder).
// 3. Put the conditions object into the search request object.
// 4. Execute the search.
@Test
public void testSearch() throws Exception {
    // Highlighting: wrap matches in the "name" field with a red <font> tag.
    HighlightBuilder highlight = new HighlightBuilder();
    highlight.field("name");
    highlight.preTags("<font color='red'>");
    highlight.postTags("</font>");

    // Conditions: term query on "name", first page with a page size of one.
    SearchSourceBuilder conditions = new SearchSourceBuilder();
    TermQueryBuilder nameTerm = QueryBuilders.termQuery("name", "张");
    conditions.query(nameTerm);
    conditions.from(0);
    conditions.size(1);
    // Sorting is left disabled; to enable it: conditions.sort("age");
    conditions.highlighter(highlight);

    SearchRequest request = new SearchRequest("qy151-index");
    request.source(conditions);
    SearchResponse response = client.search(request, RequestOptions.DEFAULT);

    System.out.println("总条数:" + response.getHits().getTotalHits().value);
    SearchHit[] hits = response.getHits().getHits();
    // First pass prints every hit's source, second pass every hit's highlight fields.
    for (SearchHit hit : hits) {
        System.out.println(hit.getSourceAsString());
    }
    for (SearchHit hit : hits) {
        System.out.println(hit.getHighlightFields());
    }
}
3. 综合案例--JD搜索
导入依赖
<dependency>
<groupId>org.jsoup</groupId>
<artifactId>jsoup</artifactId>
<version>1.11.3</version>
</dependency>
package com.lpt;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;
import org.springframework.context.annotation.Configuration;
import java.net.URL;
/**
 * Demo scraper for the JD search case study: downloads one search-result page and
 * prints the name, price and lazy-loaded image URL found in each {@code <li>} element.
 */
public class HtmlJd {

    /**
     * Fetches the search page and prints one line per {@code <li>} element.
     *
     * @param args unused
     * @throws Exception if the page cannot be fetched or parsed
     */
    public static void main(String[] args) throws Exception {
        String path = "https://search.jd.com/Search?keyword=%E6%9C%BA%E6%A2%B0%E9%9D%A9%E5%91%BD";
        // Second argument is the fetch timeout in milliseconds.
        Document page = Jsoup.parse(new URL(path), 30000);
        Elements items = page.getElementsByTag("li");
        for (Element item : items) {
            // eq(0) keeps only the first match, so an element without the class/tag yields "".
            String price = item.getElementsByClass("p-price").eq(0).text();
            String name = item.getElementsByClass("p-name").eq(0).text();
            String img = item.getElementsByTag("img").eq(0).attr("data-lazy-img");
            // Print every extracted field; previously price and name were computed and discarded.
            System.out.println(name + " | " + price + " | " + img);
        }
    }
}