Lucene的其他搜索(三)

生成索引：

package com.wp.search;

import java.nio.file.Paths;

import org.apache.lucene.analysis.Analyzer;

import org.apache.lucene.analysis.standard.StandardAnalyzer;

import org.apache.lucene.document.Document;

import org.apache.lucene.document.Field;

import org.apache.lucene.document.IntField;

import org.apache.lucene.document.StringField;

import org.apache.lucene.document.TextField;

import org.apache.lucene.index.IndexWriter;

import org.apache.lucene.index.IndexWriterConfig;

import org.apache.lucene.store.Directory;

import org.apache.lucene.store.FSDirectory;

/**
 * Builds a small demo Lucene index of three city documents, each with an
 * {@code id}, a {@code city} and a {@code desc} field.
 */
public class Indexer {

    private final int[] ids = { 1, 2, 3 };

    private final String[] citys = { "aingdao", "banjing", "changhai" };

    // The third description ("Shanghai is d dustling dity.") deliberately
    // contains neither "b" nor "c", so that the term-range search demo over
    // the "desc" field has a document that falls outside the range.
    private final String[] descs = { "Qingdao is b beautiful city.",
            "Nanjing is c city of culture.", "Shanghai is d dustling dity." };

    /** Directory the index is written to; assigned by {@link #index(String)}. */
    private Directory dir;

    /**
     * Creates an {@link IndexWriter} on {@link #dir} configured with a
     * {@link StandardAnalyzer}.
     *
     * @return a new writer; the caller is responsible for closing it
     * @throws Exception if the writer cannot be opened
     */
    private IndexWriter getWriter() throws Exception {
        Analyzer analyzer = new StandardAnalyzer(); // standard tokenizer/analyzer
        IndexWriterConfig iwc = new IndexWriterConfig(analyzer);
        return new IndexWriter(dir, iwc);
    }

    /**
     * Writes one document per entry of {@code ids}/{@code citys}/{@code descs}
     * into the index located at {@code indexDir}.
     *
     * <p>NOTE(review): the writer config is left at its default open mode, so
     * running this repeatedly against the same directory presumably appends
     * the same documents again - confirm whether that is intended.
     *
     * @param indexDir file-system path of the index directory
     * @throws Exception if the directory cannot be opened or a document
     *                   cannot be written
     */
    private void index(String indexDir) throws Exception {
        dir = FSDirectory.open(Paths.get(indexDir));
        // try-with-resources guarantees the writer (and with it the index
        // write lock) is released even when addDocument fails part-way.
        try (IndexWriter writer = getWriter()) {
            for (int i = 0; i < ids.length; i++) {
                Document doc = new Document();
                doc.add(new IntField("id", ids[i], Field.Store.YES));
                // StringField is indexed as a single un-analyzed token.
                doc.add(new StringField("city", citys[i], Field.Store.YES));
                // TextField is run through the analyzer.
                doc.add(new TextField("desc", descs[i], Field.Store.YES));
                writer.addDocument(doc);
            }
        } finally {
            dir.close();
        }
    }

    public static void main(String[] args) throws Exception {
        new Indexer().index("D:\\lucene\\luceneIndex");
    }

}

其他搜索:

package com.wp.search;

import java.nio.file.Paths;

import org.apache.lucene.document.Document;

import org.apache.lucene.index.DirectoryReader;

import org.apache.lucene.index.IndexReader;

import org.apache.lucene.index.Term;

import org.apache.lucene.search.BooleanClause;

import org.apache.lucene.search.BooleanQuery;

import org.apache.lucene.search.IndexSearcher;

import org.apache.lucene.search.NumericRangeQuery;

import org.apache.lucene.search.PrefixQuery;

import org.apache.lucene.search.ScoreDoc;

import org.apache.lucene.search.TermRangeQuery;

import org.apache.lucene.search.TopDocs;

import org.apache.lucene.store.Directory;

import org.apache.lucene.store.FSDirectory;

import org.apache.lucene.util.BytesRef;

import org.junit.After;

import org.junit.Before;

import org.junit.Test;

/**
 * JUnit demos of several Lucene query types (term range, numeric range,
 * prefix and boolean) run against the index stored at
 * {@code D:\lucene\luceneIndex}. Each test prints the stored {@code id},
 * {@code city} and {@code desc} fields of every hit.
 */
public class SearchTest {

    /** Maximum number of top hits requested from each search. */
    private static final int MAX_HITS = 10;

    private Directory dir;

    private IndexReader reader;

    private IndexSearcher is;

    /**
     * Opens the index directory and creates the searcher used by the tests.
     *
     * @throws Exception if the index cannot be opened
     */
    @Before
    public void setUp() throws Exception {
        dir = FSDirectory.open(Paths.get("D:\\lucene\\luceneIndex"));
        reader = DirectoryReader.open(dir);
        is = new IndexSearcher(reader);
    }

    /**
     * Releases the reader and the directory. Both are null-checked so that a
     * failure inside {@link #setUp()} is not masked by a NullPointerException
     * here.
     *
     * @throws Exception if closing either resource fails
     */
    @After
    public void tearDown() throws Exception {
        try {
            if (reader != null) {
                reader.close();
            }
        } finally {
            if (dir != null) {
                dir.close();
            }
        }
    }

    /**
     * Prints the stored "id", "city" and "desc" fields of every hit.
     *
     * @param hits search result whose documents are loaded and printed
     * @throws Exception if a document cannot be loaded from the index
     */
    private void printHits(TopDocs hits) throws Exception {
        for (ScoreDoc scoreDoc : hits.scoreDocs) {
            Document doc = is.doc(scoreDoc.doc); // load the stored fields of the hit
            System.out.println(doc.get("id"));
            System.out.println(doc.get("city"));
            System.out.println(doc.get("desc"));
        }
    }

    /**
     * Term range search: matches documents whose "desc" field contains a term
     * in the inclusive range ["b", "c"]. The indexed description
     * "Shanghai is d dustling dity." was written without "b" or "c" so that
     * the effect of the range is easy to see in the output.
     *
     * @throws Exception if the search fails
     */
    @Test
    public void testTermRangeQuery() throws Exception {
        // BytesRef(CharSequence) always encodes as UTF-8, unlike
        // String.getBytes(), which depends on the platform default charset.
        TermRangeQuery query = new TermRangeQuery("desc", new BytesRef("b"),
                new BytesRef("c"), true, true);
        printHits(is.search(query, MAX_HITS));
    }

    /**
     * Numeric range search: matches documents whose "id" lies in the
     * inclusive range [1, 3].
     *
     * @throws Exception if the search fails
     */
    @Test
    public void testNumericRangeQuery() throws Exception {
        NumericRangeQuery<Integer> query = NumericRangeQuery.newIntRange("id",
                1, 3, true, true);
        printHits(is.search(query, MAX_HITS));
    }

    /**
     * Prefix search: matches documents whose "city" starts with "a".
     *
     * @throws Exception if the search fails
     */
    @Test
    public void testPrefixQuery() throws Exception {
        PrefixQuery query = new PrefixQuery(new Term("city", "a"));
        printHits(is.search(query, MAX_HITS));
    }

    /**
     * Combined search: "id" in the inclusive range [1, 2] AND "city" starting
     * with "a".
     *
     * @throws Exception if the search fails
     */
    @Test
    public void testBooleanQuery() throws Exception {
        NumericRangeQuery<Integer> query1 = NumericRangeQuery.newIntRange("id",
                1, 2, true, true);
        PrefixQuery query2 = new PrefixQuery(new Term("city", "a"));

        BooleanQuery.Builder booleanQuery = new BooleanQuery.Builder();
        // Occur.MUST means "and". To experiment, replace it with
        // Occur.SHOULD ("or") or Occur.MUST_NOT ("exclude").
        booleanQuery.add(query1, BooleanClause.Occur.MUST);
        booleanQuery.add(query2, BooleanClause.Occur.MUST);

        printHits(is.search(booleanQuery.build(), MAX_HITS));
    }

}

Lucene的其他搜索(三)的更多相关文章

Apache Solr采用Java开发、基于Lucene的全文搜索服务器
http://docs.spring.io/spring-data/solr/ 首先介绍一下solr: Apache Solr (读音: SOLer) 是一个开源.高性能.采用Java开发.基于Luc ...
基于 Lucene 的桌面文件搜索
开源2010年,自己在学习 Lucene 时开发的一款桌面文件搜索工具,这么多年过去了,代码一直静静存放在自己的硬盘上,与其让其沉睡,不如分享出来. 这款工具带有明显的模仿 Everything 的痕 ...
Apache Lucene(全文检索引擎)—搜索
目录返回目录:http://www.cnblogs.com/hanyinglong/p/5464604.html 本项目Demo已上传GitHub,欢迎大家fork下载学习:https://gith ...
lucene学习笔记：三，Lucene的索引文件格式
Lucene的索引里面存了些什么,如何存放的,也即Lucene的索引文件格式,是读懂Lucene源代码的一把钥匙. 当我们真正进入到Lucene源代码之中的时候,我们会发现: Lucene的索引过程, ...
lucene的多种搜索2-SpanQuery
SpanQuery按照词在文章中的距离或者查询几个相邻词的查询 SpanQuery包括以下几种: SpanTermQuery:词距查询的基础,结果和TermQuery相似,只不过是增加了查询结果中单词 ...
如何使用 Lucene 做网站高亮搜索功能？
现在基本上所有网站都支持搜索功能,现在搜索的工具有很多,比如Solr.Elasticsearch,它们都是基于 Lucene 实现的,各有各的使用场景.Lucene 比较灵活,中小型项目中使用的比较多 ...
一种安全云存储方案设计（下）——基于Lucene的云端搜索与密文基础上的模糊查询
一种安全的云存储方案设计(未完整理中) 一篇老文了,现在看看错漏颇多,提到的一些技术已经跟不上了.仅对部分内容重新做了一些修正,增加了一些机器学习的内容,然并卵. 这几年来,云产品层出不穷,但其安全性 ...
Lucene建立索引搜索入门实例
第一部分:Lucene建立索引 Lucene建立索引主要有以下两步:第一步:建立索引器第二步:添加索引文件准备在f盘建立lucene文件夹,然后 ...
WebGIS中解决使用Lucene进行兴趣点搜索排序的两种思路
文章版权由作者李晓晖和博客园共有,若转载请于明显处标明出处:http://www.cnblogs.com/naaoveGIS/. 1.背景目前跟信息采集相关的一个项目提出了这样的一个需求:中国银行等 ...

随机推荐

Logging - MVC Using Log4net Save to File and Database
第一步:创建Config文件夹和log4net.config 第二步:在log4net.config粘贴以下配置 <?xml version="1.0" encoding=" ...
F - Count the Colors ZOJ - 1610 线段树染色（染区间映射）
题意:给一段0-8000的线段染色问最后颜色x 有几段题解:标准线段树但是没有push_up 最后查询是单点按顺序查询每一个点考虑过使用区间来维护不同的线段有多少种各色的线段思路是 ...
洛谷P2858奶牛零食题解
题目这个题一开始能看出来是一道动态规划的题目,但是并不知道如何写状态转移方程,但是我们可以想一想这个题应该是一道区间DP,而区间DP的特点就是状态转移方程一般跟该区间的左节点和右节点或者中间断点有关 ...
IDEA @Contract annotation
IDEA @Contract annotation ----------------------------------- http://www.jetbrains.com/help/idea/con ...
[WC2018]州区划分(FWT)
题目描述题解这道题的思路感觉很妙. 题目中有一个很奇怪的不合法条件,貌似和后面做题没有什么关系,所以我们先得搞掉它. 也就是判断一个点集是否合法,也就是判断这个点集是否存在欧拉回路. 如果存在欧拉 ...
在JSON中遇到的一些坑
今天在进行压测的时候,由于需要使用到json进行传参,并且需要在JMeter中加入少量的JSON,由于JSON在java中呈现键值对的形式,并且需要使用到“”来修饰,导致只能使用\进行转义,在发送请求 ...
C语言中的类型转换——将字符串s转换为整数型(int)类型
在讲类型转换之前,我们先要理解下C语言中单引号和双引号的区别. 先讲双引号,双引号就是字符串,我们要证实我们的想法,我选择写一段代码看看开: #include <stdio.h> int ...
nio 阻塞非阻塞同步异步
https://mp.weixin.qq.com/s/5SKgdkC0kaHN495psLd3Tg 说在前面上篇NIO相关基础篇二,主要介绍了文件锁.以及比较关键的Selector,本篇继续NIO相 ...
java 判断元素是否在数组内
一,先转为List,再使用contains()方法 String[] strArr = new String[] { "a", "b", "c" ...
【洛谷P4144】大河的序列
题目大意:给定一个长度为 N 的序列,求序列中连续区间最大的(或和加与和)是多少. 题解: 引理:任意两个数 \(i, j\),若 \(i>j\),则在二进制表示下,i 对应的二进制串的字典序一 ...

Lucene的其他搜索(三)

Lucene的其他搜索(三)的更多相关文章

随机推荐

热门专题