IT数码 购物 网址 头条 软件 日历 阅读 图书馆
TxT小说阅读器
↓语音阅读,小说下载,古典文学↓
图片批量下载器
↓批量下载图片,美女图库↓
图片自动播放器
↓图片自动播放器↓
一键清除垃圾
↓轻轻一点,清除系统垃圾↓
开发: C++知识库 Java知识库 JavaScript Python PHP知识库 人工智能 区块链 大数据 移动开发 嵌入式 开发工具 数据结构与算法 开发测试 游戏开发 网络协议 系统运维
教程: HTML教程 CSS教程 JavaScript教程 Go语言教程 JQuery教程 VUE教程 VUE3教程 Bootstrap教程 SQL数据库教程 C语言教程 C++教程 Java教程 Python教程 Python3教程 C#教程
数码: 电脑 笔记本 显卡 显示器 固态硬盘 硬盘 耳机 手机 iphone vivo oppo 小米 华为 单反 装机 图拉丁
 
   -> 大数据 -> SpringBoot-ElasticSearch -> 正文阅读

[大数据]SpringBoot-ElasticSearch

修改ES依赖版本与安装的ES软件版本一致

    <properties>
        <java.version>1.8</java.version>
        <!--    Keep this dependency version identical to the installed Elasticsearch server version     -->
        <elasticsearch.version>7.6.2</elasticsearch.version>
    </properties>
    <dependencies>
        <!--  JSON serialization used to turn entities into document sources.
              NOTE(review): 1.2.62 is an old fastjson release; check its security advisories before production use.  -->
        <dependency>
            <groupId>com.alibaba</groupId>
            <artifactId>fastjson</artifactId>
            <version>1.2.62</version>
        </dependency>
        <!--  Spring Data Elasticsearch starter; no version is given here, so it is expected to come from the parent/BOM  -->
        <dependency>
            <groupId>org.springframework.boot</groupId>
            <artifactId>spring-boot-starter-data-elasticsearch</artifactId>
        </dependency>
        <dependency>
            <groupId>org.springframework.boot</groupId>
            <artifactId>spring-boot-devtools</artifactId>
            <scope>runtime</scope>
            <optional>true</optional>
        </dependency>
        <dependency>
            <groupId>org.projectlombok</groupId>
            <artifactId>lombok</artifactId>
            <optional>true</optional>
        </dependency>
        <dependency>
            <groupId>org.springframework.boot</groupId>
            <artifactId>spring-boot-starter-test</artifactId>
            <scope>test</scope>
        </dependency>
    </dependencies>

向 Spring 容器中注册 ES 的高级 REST 风格客户端工具类:RestHighLevelClient

@Configuration
public class Config {

    /**
     * Registers the Elasticsearch high-level REST client as a bean; all
     * Elasticsearch operations in the application go through this client.
     *
     * @return a client connected to {@code http://localhost:9200}
     */
    @Bean
    public RestHighLevelClient restHighLevelClient() {
        // RestClient.builder takes an array of HttpHost; for a cluster, pass several HttpHost instances.
        HttpHost node = new HttpHost("localhost", 9200, "http");
        return new RestHighLevelClient(RestClient.builder(node));
    }
}

数据实体类

/**
 * Data entity that is serialized to JSON and stored as an Elasticsearch document.
 *
 * <p>Lombok generates the accessors plus the no-args and all-args constructors;
 * the all-args constructor takes the fields in declaration order
 * ({@code name, age, sal, birth}).
 */
@Data
@AllArgsConstructor
@NoArgsConstructor
// NOTE(review): @Component registers this data holder as a Spring bean; nothing visible here injects it - confirm it is needed.
@Component
public class User {
    // Display name of the user.
    private String name;
    // Age of the user.
    private int age;
    // Presumably the salary - TODO confirm meaning and unit.
    private double sal;
    // Birth date kept as text; the examples in this file use the form "2020-02-05".
    private String birth;
}

对索引及文档的操作

@SpringBootTest
class ElasticApplicationTests {
    @Autowired
    RestHighLevelClient restHighLevelClient;

    // Index-level operations: request types are named *IndexRequest and
    // responses *IndexResponse.

    /** Creates the "muchen" index (CreateIndexRequest) and prints the response. */
    @Test
    void createIndex() throws IOException {
        CreateIndexResponse created = restHighLevelClient.indices()
                .create(new CreateIndexRequest("muchen"), RequestOptions.DEFAULT);
        System.out.println(created);
    }

    /** Checks whether the "muchen" index exists (GetIndexRequest) and prints the answer. */
    @Test
    void getIndex() throws IOException {
        GetIndexRequest lookup = new GetIndexRequest("muchen");
        // indices().get(lookup, RequestOptions.DEFAULT) would return a GetIndexResponse instead;
        // only the existence check is performed here.
        boolean present = restHighLevelClient.indices().exists(lookup, RequestOptions.DEFAULT);
        System.out.println(present);
    }

    /** Deletes the "muchen" index (DeleteIndexRequest) and prints whether it was acknowledged. */
    @Test
    void deleteIndex() throws IOException {
        AcknowledgedResponse outcome = restHighLevelClient.indices()
                .delete(new DeleteIndexRequest("muchen"), RequestOptions.DEFAULT);
        System.out.println(outcome.isAcknowledged());
    }

    /** Indexes one document with id "1" (IndexRequest via client.index). */
    @Test
    void addDocument() throws IOException {
        // The entity is serialized to JSON and used as the document source.
        String payload = JSON.toJSONString(new User("张三", 12, 9000, "2020-02-05"));

        // Request bound to the target index, with an explicit id and timeout.
        IndexRequest indexRequest = new IndexRequest("muchen");
        indexRequest.id("1");
        indexRequest.timeout("5s");
        indexRequest.source(payload, XContentType.JSON);

        IndexResponse stored = restHighLevelClient.index(indexRequest, RequestOptions.DEFAULT);
        System.out.println(stored.toString());
    }

    /** Prints whether document "1" exists in the "muchen" index. */
    @Test
    void isExistDoc() throws IOException {
        boolean present = restHighLevelClient.exists(new GetRequest("muchen", "1"), RequestOptions.DEFAULT);
        System.out.println(present);
    }

    /** Fetches document "1" (GetRequest via client.get) and prints its source and the raw response. */
    @Test
    void getDocument() throws IOException {
        GetResponse fetched = restHighLevelClient.get(new GetRequest("muchen", "1"), RequestOptions.DEFAULT);
        System.out.println(fetched.getSourceAsString());
        System.out.println(fetched);
    }

    /** Updates document "1" with new field values (UpdateRequest via client.update). */
    @Test
    void updateDocument() throws IOException {
        // New field values, serialized to JSON.
        String payload = JSON.toJSONString(new User("猪刚鬣不刚烈", 100, 1999, "1799-09-09"));

        // Update request bound to the index and document id.
        UpdateRequest updateRequest = new UpdateRequest("muchen", "1");
        updateRequest.timeout("5s");
        updateRequest.doc(payload, XContentType.JSON);

        UpdateResponse updated = restHighLevelClient.update(updateRequest, RequestOptions.DEFAULT);
        System.out.println(updated);
        System.out.println(updated.status());
    }

    /** Deletes document "1" (DeleteRequest via client.delete). */
    @Test
    void deleteDocument() throws IOException {
        DeleteRequest deleteRequest = new DeleteRequest("muchen", "1");
        deleteRequest.timeout("5s");
        DeleteResponse removed = restHighLevelClient.delete(deleteRequest, RequestOptions.DEFAULT);
        System.out.println(removed);
        System.out.println(removed.status());
    }

    /** Indexes several documents with a single bulk request. */
    @Test
    void bulkDocument() throws IOException {
        // Sample data for the batch.
        List<User> users = new ArrayList<>();
        users.add(new User("张三",13,33333,"1909-09-09"));
        users.add(new User("张三去",12,3333,"1909-09-09"));
        users.add(new User("张三我",14,9333,"1909-09-09"));
        users.add(new User("张三饿",15,33993,"1909-09-09"));
        users.add(new User("张三如律",13,6333,"1909-09-09"));
        users.add(new User("张三他",123,53333,"1909-09-09"));
        users.add(new User("张三有",3,3633,"1909-09-09"));

        BulkRequest batch = new BulkRequest();
        batch.timeout("5s");

        // Ids are assigned sequentially starting at "1"; per the original note, omitting
        // the id yields a randomly generated string id. UpdateRequest / DeleteRequest can
        // be added the same way for bulk updates / deletes.
        int nextId = 1;
        for (User user : users) {
            IndexRequest item = new IndexRequest("muchen")
                    .id(String.valueOf(nextId))
                    .source(JSON.toJSONString(user), XContentType.JSON);
            batch.add(item);
            nextId++;
        }

        BulkResponse outcome = restHighLevelClient.bulk(batch, RequestOptions.DEFAULT);
        System.out.println(outcome.status());
        System.out.println(outcome);
    }

    /** Runs a match query on the "name" field and prints every hit's source as JSON. */
    @Test
    void searchDocument() throws IOException {
        // Search criteria: a match query plus a timeout.
        SearchSourceBuilder criteria = new SearchSourceBuilder();
        criteria.query(QueryBuilders.matchQuery("name", "张"));
        criteria.timeout(new TimeValue(10000));

        // Attach the criteria to a request targeting the index.
        SearchRequest searchRequest = new SearchRequest("muchen");
        searchRequest.source(criteria);

        SearchResponse found = restHighLevelClient.search(searchRequest, RequestOptions.DEFAULT);
        SearchHit[] hits = found.getHits().getHits();
        for (SearchHit hit : hits) {
            System.out.println(JSON.toJSONString(hit.getSourceAsMap()));
        }
    }
}

实例

爬取数据

        <!--  HTML page parsing (jsoup)    -->
        <dependency>
            <groupId>org.jsoup</groupId>
            <artifactId>jsoup</artifactId>
            <version>1.10.2</version>
        </dependency>
public class HtmlParseUtil {

    /** Timeout, in milliseconds, for fetching and parsing the search page. */
    private static final int FETCH_TIMEOUT_MILLIS = 15000;

    /** Number of leading characters stripped from the {@code prdid} value. */
    private static final int PRDID_PREFIX_LENGTH = 7;

    /**
     * Crawls the Suning search result page for a keyword and extracts one
     * {@code Content} per product entry, to be loaded into the index.
     *
     * <p>Entries that lack the {@code sa-data} attribute or a usable
     * {@code prdid} value are skipped instead of aborting the whole crawl.
     *
     * @param keyword search keyword; it is URL-encoded before being placed in the path
     * @return the extracted entries; empty when the keyword is blank or the
     *         page has no {@code product-list} element
     * @throws IOException if the page cannot be fetched or parsed
     */
    public List<Content> getData(String keyword) throws IOException {
        List<Content> list = new ArrayList<>();
        if (keyword == null || keyword.trim().isEmpty()) {
            return list;
        }

        // Non-ASCII keywords and spaces must be percent-encoded to form a valid URL.
        // URLEncoder targets form encoding ("+" for space), so map "+" to "%20" for a path segment.
        String encodedKeyword = java.net.URLEncoder.encode(keyword, "UTF-8").replace("+", "%20");
        String url = "https://search.suning.com/" + encodedKeyword + "/";

        // Fetch the page and parse it into a jsoup Document.
        Document document = Jsoup.parse(new URL(url), FETCH_TIMEOUT_MILLIS);

        // The element lookups below mirror the DOM methods available in JavaScript.
        Element productList = document.getElementById("product-list");
        if (productList == null) {
            // Layout changed or no results: nothing to extract.
            return list;
        }

        for (Element li : productList.getElementsByTag("li")) {
            String saData = li.getElementsByClass("sellPoint").eq(0).attr("sa-data");
            if (saData.trim().isEmpty()) {
                // Not a product entry (no embedded product data).
                continue;
            }
            String productId = JSON.parseObject(saData).getString("prdid");
            if (productId == null || productId.length() < PRDID_PREFIX_LENGTH) {
                continue;
            }

            String img = li.getElementsByTag("img").eq(0).attr("src");
            // NOTE(review): this value is passed as Content's second ("price") argument,
            // but it is derived from the prdid field - confirm it is really the price.
            String price = productId.substring(PRDID_PREFIX_LENGTH);
            String title = li.getElementsByClass("title-selling-point").eq(0).text();
            list.add(new Content(img, price, title));
        }
        return list;
    }
}
/**
     * Crawls product data for a keyword and bulk-indexes it into the
     * {@code su_list} index.
     *
     * @param keyword search keyword handed to {@code HtmlParseUtil.getData}
     * @return {@code true} when at least one document was sent and the bulk
     *         response reports no failures; {@code false} when nothing was
     *         crawled or any item failed
     * @throws IOException if crawling or the bulk request fails
     */
    public boolean parseData(String keyword) throws IOException {
        List<Content> contentList = new HtmlParseUtil().getData(keyword);
        // A BulkRequest without any action is rejected by request validation
        // ("no requests added"), so report "nothing imported" instead of throwing.
        if (contentList == null || contentList.isEmpty()) {
            return false;
        }

        BulkRequest bulkRequest = new BulkRequest();
        for (Content content : contentList) {
            // No explicit id: Elasticsearch generates one per document.
            bulkRequest.add(new IndexRequest("su_list").source(JSON.toJSONString(content), XContentType.JSON));
        }
        BulkResponse bulkResponse = restHighLevelClient.bulk(bulkRequest, RequestOptions.DEFAULT);
        return !bulkResponse.hasFailures();
    }

查询

/**
 * Search service over the {@code su_list} index.
 *
 * <p>Both search methods run a full-text match query on the {@code title}
 * field and return each hit's source document as a map.
 */
@Service
public class ContentService {

    /** Index holding the crawled product documents. */
    private static final String INDEX_NAME = "su_list";

    /** Field that is searched and highlighted. */
    private static final String TITLE_FIELD = "title";

    /** Search timeout in milliseconds. */
    private static final long SEARCH_TIMEOUT_MILLIS = 30000;

    @Autowired
    RestHighLevelClient restHighLevelClient;

    /**
     * Plain search: match query on the title, one page of results.
     *
     * @param keyword  text to match against the title
     * @param pageNo   1-based page number; values below 1 are treated as page 1
     * @param pageSize number of hits per page
     * @return the source documents of the hits on the requested page
     * @throws IOException if the search request fails
     */
    public List<Map<String, Object>> searchData(String keyword, int pageNo, int pageSize) throws IOException {
        SearchSourceBuilder searchSourceBuilder = newTitleSearch(keyword, pageNo, pageSize);
        SearchResponse searchResponse = execute(searchSourceBuilder);

        List<Map<String, Object>> list = new ArrayList<>();
        for (SearchHit hit : searchResponse.getHits().getHits()) {
            list.add(hit.getSourceAsMap());
        }
        return list;
    }

    /**
     * Highlighted search: same query as {@link #searchData}, but the title of
     * each hit is replaced by its highlighted form (matches wrapped in a red
     * {@code <span>}). Hits without a title highlight keep their original title.
     *
     * @param keyword  text to match against the title
     * @param pageNo   1-based page number; values below 1 are treated as page 1
     * @param pageSize number of hits per page
     * @return the source documents of the hits, with highlighted titles where available
     * @throws IOException if the search request fails
     */
    public List<Map<String, Object>> searchHighLightData(String keyword, int pageNo, int pageSize) throws IOException {
        HighlightBuilder highlightBuilder = new HighlightBuilder();
        highlightBuilder.field(TITLE_FIELD);
        // Markup placed around every highlighted match.
        highlightBuilder.preTags("<span style='color:red;'>");
        highlightBuilder.postTags("</span>");
        // false: do not restrict highlighting to the field the query matched on.
        highlightBuilder.requireFieldMatch(false);

        SearchSourceBuilder searchSourceBuilder = newTitleSearch(keyword, pageNo, pageSize);
        searchSourceBuilder.highlighter(highlightBuilder);
        SearchResponse searchResponse = execute(searchSourceBuilder);

        List<Map<String, Object>> list = new ArrayList<>();
        for (SearchHit hit : searchResponse.getHits().getHits()) {
            Map<String, Object> sourceAsMap = hit.getSourceAsMap();
            HighlightField highlightedTitle = hit.getHighlightFields().get(TITLE_FIELD);
            String merged = joinFragments(highlightedTitle);
            // Only overwrite when a highlight exists; otherwise the title would be blanked out.
            if (merged != null) {
                sourceAsMap.put(TITLE_FIELD, merged);
            }
            list.add(sourceAsMap);
        }
        return list;
    }

    /** Builds the paged match query on the title shared by both search methods. */
    private SearchSourceBuilder newTitleSearch(String keyword, int pageNo, int pageSize) {
        SearchSourceBuilder searchSourceBuilder = new SearchSourceBuilder();
        // "from" is a document offset, not a page number: convert the 1-based page to an offset.
        int offset = (Math.max(pageNo, 1) - 1) * pageSize;
        searchSourceBuilder.from(offset);
        searchSourceBuilder.size(pageSize);
        // Full-text match (analyzed), not an exact term query.
        MatchQueryBuilder matchQuery = QueryBuilders.matchQuery(TITLE_FIELD, keyword);
        searchSourceBuilder.query(matchQuery);
        searchSourceBuilder.timeout(new TimeValue(SEARCH_TIMEOUT_MILLIS));
        return searchSourceBuilder;
    }

    /** Sends the given search definition to the product index. */
    private SearchResponse execute(SearchSourceBuilder searchSourceBuilder) throws IOException {
        SearchRequest searchRequest = new SearchRequest(INDEX_NAME);
        searchRequest.source(searchSourceBuilder);
        return restHighLevelClient.search(searchRequest, RequestOptions.DEFAULT);
    }

    /** Concatenates the highlight fragments, or returns {@code null} when there are none. */
    private String joinFragments(HighlightField field) {
        if (field == null) {
            return null;
        }
        Text[] fragments = field.fragments();
        if (fragments == null || fragments.length == 0) {
            return null;
        }
        StringBuilder joined = new StringBuilder();
        for (Text fragment : fragments) {
            joined.append(fragment);
        }
        return joined.toString();
    }

}
  大数据 最新文章
实现Kafka至少消费一次
亚马逊云科技:还在苦于ETL?Zero ETL的时代
初探MapReduce
【SpringBoot框架篇】32.基于注解+redis实现
Elasticsearch:如何减少 Elasticsearch 集
Go redis操作
Redis面试题
专题五 Redis高并发场景
基于GBase8s和Calcite的多数据源查询
Redis——底层数据结构原理
上一篇文章      下一篇文章      查看所有文章
加:2021-08-07 12:09:17  更:2021-08-07 12:10:23 
 
开发: C++知识库 Java知识库 JavaScript Python PHP知识库 人工智能 区块链 大数据 移动开发 嵌入式 开发工具 数据结构与算法 开发测试 游戏开发 网络协议 系统运维
教程: HTML教程 CSS教程 JavaScript教程 Go语言教程 JQuery教程 VUE教程 VUE3教程 Bootstrap教程 SQL数据库教程 C语言教程 C++教程 Java教程 Python教程 Python3教程 C#教程
数码: 电脑 笔记本 显卡 显示器 固态硬盘 硬盘 耳机 手机 iphone vivo oppo 小米 华为 单反 装机 图拉丁

360图书馆 购物 三丰科技 阅读网 日历 万年历 2024年5日历 -2024/5/17 17:02:40-

图片自动播放器
↓图片自动播放器↓
TxT小说阅读器
↓语音阅读,小说下载,古典文学↓
一键清除垃圾
↓轻轻一点,清除系统垃圾↓
图片批量下载器
↓批量下载图片,美女图库↓
  网站联系: qq:121756557 email:121756557@qq.com  IT数码