lucene 结合数据库做搜索

package jdbc;

import java.sql.Connection;

import java.sql.DriverManager;

import java.sql.PreparedStatement;

import java.sql.SQLException;

import java.util.UUID;

public class ConnectionUtil {

    private static String driver="com.mysql.cj.jdbc.Driver";

    private static String url="jdbc:mysql://localhost:3306/solrdb?useUnicode=true&characterEncoding=UTF-8&useSSL=false&serverTimezone=UTC&rewriteBatchedStatements=true";

    private static String user="root";

    private static String password="123456";

    public static Connection getConn() {

        try {

            Class.forName(driver);

            Connection conn=DriverManager.getConnection(url, user, password);

            return conn;

        } catch (ClassNotFoundException e) {

            // TODO Auto-generated catch block

            e.printStackTrace();

        } catch (SQLException e) {

            // TODO Auto-generated catch block

            e.printStackTrace();

        }

        return null;

    }

    public void CreateData() {

        Connection conn=getConn();

        try {

        PreparedStatement ps=conn.prepareStatement

                ("insert into paper (id,name,title,author,content) values (?,?,?,?,?)");

        for(int i=0;i<100;i++) {

            ps.setString(1,UUID.randomUUID().toString());

            ps.setString(2,"专家233"+i);

            ps.setString(3,"杭州九次人大会议"+i);

            ps.setString(4,"记者");

            ps.setString(5, "北京时间2019-2-13日,杭州市举行了人大代表会议,会议决定现在...."+i);

            ps.executeUpdate();

        }

        System.out.println("执行完毕");

        } catch (SQLException e) {

            e.printStackTrace();

        }

    }

    public static void main(String[] args) {

        ConnectionUtil util=new ConnectionUtil();

        util.CreateData();

    }

}

//本类只为造数据

package jdbc;

import java.io.IOException;

import java.nio.file.Files;

import java.nio.file.Path;

import java.nio.file.Paths;

import java.sql.Connection;

import java.sql.PreparedStatement;

import java.sql.ResultSet;

import java.sql.SQLException;

import java.util.ArrayList;

import java.util.Date;

import java.util.List;

import org.apache.lucene.analysis.Analyzer;

import org.apache.lucene.analysis.standard.StandardAnalyzer;

import org.apache.lucene.document.Document;

import org.apache.lucene.document.Field;

import org.apache.lucene.document.FieldType;

import org.apache.lucene.index.IndexOptions;

import org.apache.lucene.index.IndexWriter;

import org.apache.lucene.index.IndexWriterConfig;

import org.apache.lucene.index.IndexWriterConfig.OpenMode;

import org.apache.lucene.store.Directory;

import org.apache.lucene.store.FSDirectory;

/**

 * Lucene 创建索引

 * @author moonxy

 *

 */

public class CreateIndexForMysql {

	public static List<Paper> CreateData() {

		Connection conn=ConnectionUtil.getConn();

		List<Paper>list=new ArrayList<Paper>();

		try {

		PreparedStatement ps=conn.prepareStatement

				("select * from paper ");

		ResultSet rs=ps.executeQuery();

		         //4.处理数据库的返回结果(使用ResultSet类)

		         while(rs.next()){

		            Paper paper=new Paper(rs.getString("id"),

		            		rs.getString("name"), rs.getString("title"),

		            		rs.getString("author"),rs.getString("content"));

		            list.add(paper);

		         }

		System.out.println("执行完毕");

		return list;

		} catch (SQLException e) {

			e.printStackTrace();

		}

		return null;

	}

    public static void main(String[] args) {

        // 创建3个News对象

        // 开始时间

        Date start = new Date();

        System.out.println("**********开始创建索引**********");

        // 创建IK分词器

        Analyzer analyzer = new StandardAnalyzer();

        IndexWriterConfig icw = new IndexWriterConfig(analyzer);

        // CREATE 表示先清空索引再重新创建

        icw.setOpenMode(OpenMode.CREATE);

        Directory dir = null;

        IndexWriter inWriter = null;

        // 存储索引的目录

        Path indexPath = Paths.get("indexdir");

        try {

            if (!Files.isReadable(indexPath)) {

                System.out.println("索引目录 '" + indexPath.toAbsolutePath() + "' 不存在或者不可读,请检查");

                System.exit(1);

            }

            dir = FSDirectory.open(indexPath);

            inWriter = new IndexWriter(dir, icw);

//自己设置字段索引类型

            // 设置ID索引并存储

            FieldType idType = new FieldType();

            idType.setIndexOptions(IndexOptions.DOCS);

            idType.setStored(true);

            // 设置标题索引文档、词项频率、位移信息和偏移量，存储并词条化

            FieldType titleType = new FieldType();

            titleType.setIndexOptions(IndexOptions.DOCS_AND_FREQS_AND_POSITIONS_AND_OFFSETS);

            titleType.setStored(true);

            titleType.setTokenized(true);

            FieldType contentType = new FieldType();

            contentType.setIndexOptions(IndexOptions.DOCS_AND_FREQS_AND_POSITIONS_AND_OFFSETS);

            contentType.setStored(true);

            contentType.setTokenized(true);

            contentType.setStoreTermVectors(true);

            contentType.setStoreTermVectorPositions(true);

            contentType.setStoreTermVectorOffsets(true);

            List<Paper>list=CreateData();

            for(int i=0;i<list.size();i++) {

            	 Document doc = new Document();

            	 doc.add(new Field("id", list.get(i).getId(), idType));

            	 doc.add(new Field("title", list.get(i).getTitle(), titleType));

            	 inWriter.addDocument(doc);

            }

//

//            doc1.add(new Field("id", String.valueOf(news1.getId()), idType));

//            doc1.add(new Field("title", news1.getTitle(), titleType));

//            doc1.add(new Field("content", news1.getContent(), contentType));

//            doc1.add(new IntPoint("reply", news1.getReply()));

//            doc1.add(new StoredField("reply_display", news1.getReply()));

//

//            Document doc2 = new Document();

//            doc2.add(new Field("id", String.valueOf(news2.getId()), idType));

//            doc2.add(new Field("title", news2.getTitle(), titleType));

//            doc2.add(new Field("content", news2.getContent(), contentType));

//            doc2.add(new IntPoint("reply", news2.getReply()));

//            doc2.add(new StoredField("reply_display", news2.getReply()));

//

//            Document doc3 = new Document();

//            doc3.add(new Field("id", String.valueOf(news3.getId()), idType));

//            doc3.add(new Field("title", news3.getTitle(), titleType));

//            doc3.add(new Field("content", news3.getContent(), contentType));

//            doc3.add(new IntPoint("reply", news3.getReply()));

//            doc3.add(new StoredField("reply_display", news3.getReply()));

//            inWriter.addDocument(doc1);

//            inWriter.addDocument(doc2);

//            inWriter.addDocument(doc3);

            inWriter.commit();

            inWriter.close();

            dir.close();

        } catch (IOException e) {

            e.printStackTrace();

        }

        Date end = new Date();

        System.out.println("索引文档用时:" + (end.getTime() - start.getTime()) + " milliseconds");

        System.out.println("**********索引创建完成**********");

    }

}

　　//以上为构建索引代码

///查询代码

package query;

import java.io.IOException;

import java.nio.file.Path;

import java.nio.file.Paths;

import org.apache.lucene.analysis.Analyzer;

import org.apache.lucene.analysis.standard.StandardAnalyzer;

import org.apache.lucene.document.Document;

import org.apache.lucene.index.DirectoryReader;

import org.apache.lucene.index.IndexReader;

import org.apache.lucene.queryparser.classic.ParseException;

import org.apache.lucene.queryparser.classic.QueryParser;

import org.apache.lucene.queryparser.classic.QueryParser.Operator;

import org.apache.lucene.search.IndexSearcher;

import org.apache.lucene.search.Query;

import org.apache.lucene.search.ScoreDoc;

import org.apache.lucene.search.TopDocs;

import org.apache.lucene.store.Directory;

import org.apache.lucene.store.FSDirectory;

/**

 * 单域搜索

 * @author moonxy

 *

 */

public class QueryParseTest {

    public static void main(String[] args) throws ParseException, IOException {

        // 搜索单个字段

        String field = "title";

        // 搜索多个字段时使用数组

        //String[] fields = { "title", "content" };

        Path indexPath = Paths.get("indexdir");

        Directory dir = FSDirectory.open(indexPath);

        IndexReader reader = DirectoryReader.open(dir);

        IndexSearcher searcher = new IndexSearcher(reader);

        Analyzer analyzer = new StandardAnalyzer();//最细粒度分词

        QueryParser parser = new QueryParser(field, analyzer);

        // 多域搜索

        //MultiFieldQueryParser multiParser = new MultiFieldQueryParser(fields, analyzer);

        // 关键字同时成立使用 AND, 默认是 OR

        parser.setDefaultOperator(Operator.AND);

        // 查询语句

    //    Query query = parser.parse("农村学生");//查询关键词

        Query query = parser.parse("次人");//查询关键词

        System.out.println("Query:" + query.toString());

        // 返回前10条

        TopDocs tds = searcher.search(query, 100);

        for (ScoreDoc sd : tds.scoreDocs) {

            // Explanation explanation = searcher.explain(query, sd.doc);

            // System.out.println("explain:" + explanation + "\n");

            Document doc = searcher.doc(sd.doc);

           // System.out.println("DocID:" + sd.doc);

           // System.out.println("id:" + doc.get("id"));

            System.out.println("title:" + doc.get("title"));

         //   System.out.println("content:" + doc.get("content"));

          //  System.out.println("文档评分:" + sd.score);

        }

        dir.close();

        reader.close();

    }

}

注意我用的是MySQL 8.0 其他版本的自行更改对应的driverClass url

lucene 结合数据库做搜索的更多相关文章

Lucene.net站内搜索—6、站内搜索第二版
目录 Lucene.net站内搜索—1.SEO优化 Lucene.net站内搜索—2.Lucene.Net简介和分词Lucene.net站内搜索—3.最简单搜索引擎代码Lucene.net站内搜索—4 ...
Lucene.net站内搜索—4、搜索引擎第一版技术储备（简单介绍Log4Net、生产者消费者模式）
目录 Lucene.net站内搜索—1.SEO优化 Lucene.net站内搜索—2.Lucene.Net简介和分词Lucene.net站内搜索—3.最简单搜索引擎代码Lucene.net站内搜索—4 ...
Lucene.net站内搜索—3、最简单搜索引擎代码
目录 Lucene.net站内搜索—1.SEO优化 Lucene.net站内搜索—2.Lucene.Net简介和分词Lucene.net站内搜索—3.最简单搜索引擎代码Lucene.net站内搜索—4 ...
Lucene.net站内搜索—2、Lucene.Net简介和分词
目录 Lucene.net站内搜索—1.SEO优化 Lucene.net站内搜索—2.Lucene.Net简介和分词Lucene.net站内搜索—3.最简单搜索引擎代码Lucene.net站内搜索—4 ...
Lucene.net站内搜索—1、SEO优化
目录 Lucene.net站内搜索—1.SEO优化 Lucene.net站内搜索—2.Lucene.Net简介和分词Lucene.net站内搜索—3.最简单搜索引擎代码Lucene.net站内搜索—4 ...
使用Lucene.net提升网站搜索速度整合记录
1.随着网站数据量达到500万条的时候,发现SQL数据库如果使用LIKE语句来查询,总是占用CPU很忙,不管怎么优化,速度还是上不来; 2.经过网上收集资料,HUBBLE.net目前虽然做得不错,但需 ...
Lucene5.5.4入门以及基于Lucene实现博客搜索功能
前言一直以来个人博客的搜索功能很蹩脚,只是自己简单用数据库的like %keyword%来实现的,所以导致经常搜不到想要找的内容,而且高亮显示.摘要截取等也不好实现,所以决定采用Lucene改写博客 ...
Lucene.net站内搜索—5、搜索引擎第一版实现
目录 Lucene.net站内搜索—1.SEO优化 Lucene.net站内搜索—2.Lucene.Net简介和分词Lucene.net站内搜索—3.最简单搜索引擎代码Lucene.net站内搜索—4 ...
Lucene.Net 站内搜索
Lucene.Net 站内搜索一全文检索: like查询是全表扫描(为性能杀手)Lucene.Net搜索引擎,开源,而sql搜索引擎是收费的Lucene.Net只是一个全文检索开发包(只是帮我们 ...

随机推荐

本地项目文件夹上传至个人Github
安装Git 之后到Git官网,点击Download下载,打开安装包一路按Next一切默认直至安装结束. 找到任意一个文件夹,点击鼠标右键后若出现下图的 Git Gui Here 和 Git Bash ...
django-auth组件
auth组件一.auth模块简介 auth模块是django自带的用户认证模块,包含了身份验证和权限管理两部分. 身份验证用于核实某个用户是否合法,权限管理用于决定一个合法用户有哪些权限默认情况下 ...
Linux从入门到入门
一. 前言首先,在你的Windows系统上要想有linux系统,那就必须先安装一款软件,这里提供的是14.15的,还有ISO镜像:VMware-workstation 安装VMware:略新建虚拟 ...
成环的概率dp(初级) zoj 3329
原题地址:https://vjudge.net/problem/ZOJ-3329 题目大意: 有三个骰子,分别有k1,k2,k3个面,初始分数是0.第i骰子上的分数从1道ki.当掷三个骰子的点数分别为 ...
《剑指offer》扑克牌顺子
本题来自<剑指offer> 反转链表题目: 思路: C++ Code: Python Code: 总结:
第二卷 Spring羊群理论
写在前面: 话说这天小迦罗在和哑圣观察者聊天时,哑圣谈到自己比较喜欢吃羊,这时候小迦罗说自己的爸爸也喜欢吃,就给哑圣老师讲了他小时候在春天里放羊的故事还有参观Spring的事情.(后面以此抛砖引玉可以 ...
zookeeper（1）-简单介绍
参考: https://www.cnblogs.com/wuxl360/p/5817471.html zookeeper集群搭建 zookeeper集群原理和搭建 zookeeper集群搭建3 ...
Django：django-cors-headers 报错no module named "corsheaders"
django跨域使用 pip install django-cors-headers 然后在settings文件中加上参数设置 # app配置 INSTALLED_APPS = [ 'django.c ...
记录几个爬取动态网页时的问题(下拉框，旧的元素无法获取，获取的源代码和f12看到的不一致，爬取延迟)
更新.....这个动态网页其实直接抓取ajax请求就可以了,很简单,我之前想复杂了,虽然也实现了,但是效率极低,不过没关系,就当作是对Selenium的一次学习吧 1.最近在爬取一个动态网页,其中为了 ...
代码对齐--string|stream
https://vjudge.net/contest/185301#problem/A 学习了好多新函数,只要关注每个单词的列宽就行了.自动切分太厉害了吧~ #include<iomanip&g ...

lucene 结合数据库做搜索

lucene 结合数据库做搜索的更多相关文章

随机推荐

热门专题