Lucene 4.0 - Facet demo

package com.fox.facet;

import java.io.File;

import java.io.IOException;

import java.util.ArrayList;

import java.util.Arrays;

import java.util.List;

import org.apache.lucene.analysis.Analyzer;

import org.apache.lucene.analysis.standard.StandardAnalyzer;

import org.apache.lucene.document.Document;

import org.apache.lucene.document.Field.Store;

import org.apache.lucene.document.StringField;

import org.apache.lucene.facet.index.CategoryDocumentBuilder;

import org.apache.lucene.facet.search.FacetsCollector;

import org.apache.lucene.facet.search.params.CountFacetRequest;

import org.apache.lucene.facet.search.params.FacetSearchParams;

import org.apache.lucene.facet.search.results.FacetResult;

import org.apache.lucene.facet.search.results.FacetResultNode;

import org.apache.lucene.facet.taxonomy.CategoryPath;

import org.apache.lucene.facet.taxonomy.TaxonomyReader;

import org.apache.lucene.facet.taxonomy.TaxonomyWriter;

import org.apache.lucene.facet.taxonomy.directory.DirectoryTaxonomyReader;

import org.apache.lucene.facet.taxonomy.directory.DirectoryTaxonomyWriter;

import org.apache.lucene.index.DirectoryReader;

import org.apache.lucene.index.IndexReader;

import org.apache.lucene.index.IndexWriter;

import org.apache.lucene.index.IndexWriterConfig;

import org.apache.lucene.index.IndexWriterConfig.OpenMode;

import org.apache.lucene.index.Term;

import org.apache.lucene.search.IndexSearcher;

import org.apache.lucene.search.MultiCollector;

import org.apache.lucene.search.Query;

import org.apache.lucene.search.TermQuery;

import org.apache.lucene.search.TopScoreDocCollector;

import org.apache.lucene.store.Directory;

import org.apache.lucene.store.FSDirectory;

import org.apache.lucene.util.Version;

public class FacetingExample {

    private static final String INDEX = "d:/facet/index";

    private static final String INDEX_TAXO = "d:/facet/taxo";

    public static void main(final String[] args) throws IOException {

        Directory dir = FSDirectory.open(new File(INDEX));

        Directory taxoDir = FSDirectory.open(new File(INDEX_TAXO));

        Analyzer analyzer = new StandardAnalyzer(Version.LUCENE_40);

        IndexWriterConfig iwc = new IndexWriterConfig(Version.LUCENE_40, analyzer);

        iwc.setOpenMode(OpenMode.CREATE);

        IndexWriter writer = new IndexWriter(dir, iwc);

        TaxonomyWriter taxoWriter = new DirectoryTaxonomyWriter(taxoDir, OpenMode.CREATE_OR_APPEND);

        List<Book> books = Arrays.asList(new Book("Tom Sawyer", "Mark Twain", "1840", "Novel"), new Book("Collected Tales",

                "Mark Twain", "1850", "Novel"), new Book("The Trial", "Franz Kafka", "1901", "Novel"), new Book("Some book",

                "Some author", "1901", "Novel"));

        createDocuments(writer, taxoWriter, books);

        taxoWriter.commit();

        writer.commit();

        writer.close();

        taxoWriter.close();

        IndexReader indexReader = DirectoryReader.open(dir);

        IndexSearcher searcher = new IndexSearcher(indexReader);

        TaxonomyReader taxoReader = new DirectoryTaxonomyReader(taxoDir);

        Query q = new TermQuery(new Term("category", "Novel"));

        TopScoreDocCollector tdc = TopScoreDocCollector.create(10, true);

        FacetSearchParams facetSearchParams = new FacetSearchParams();

        facetSearchParams.addFacetRequest(new CountFacetRequest(new CategoryPath("author"), 10));

        facetSearchParams.addFacetRequest(new CountFacetRequest(new CategoryPath("category"), 10));

        facetSearchParams.addFacetRequest(new CountFacetRequest(new CategoryPath("published"), 10));

        FacetsCollector facetsCollector = new FacetsCollector(facetSearchParams, indexReader, taxoReader);

        searcher.search(q, MultiCollector.wrap(tdc, facetsCollector));

        List<FacetResult> res = facetsCollector.getFacetResults();

        System.out.println("Search for books with the category:Novel returned : " + res.size()

                + " results\n---------------------------------");

        for (final FacetResult r : res) {

            System.out.println("\nMatching " + r.getFacetResultNode().getLabel() + ":\n------------------------------------");

            for (FacetResultNode n : r.getFacetResultNode().getSubResults()) {

                System.out.println(String.format("\t%s: %.0f", n.getLabel().lastComponent(), n.getValue()));

            }

        }

    }

    private static void createDocuments(final IndexWriter writer, final TaxonomyWriter taxoWriter, final List<Book> books)

            throws IOException {

        for (final Book b : books) {

            Document doc = new Document();

            doc.add(new StringField("title", b.getTitle(), Store.YES));

            doc.add(new StringField("category", b.getCategory(), Store.YES));

            List<CategoryPath> categories = new ArrayList<CategoryPath>();

            categories.add(new CategoryPath("author", b.getAuthor()));

            categories.add(new CategoryPath("category", b.getCategory()));

            categories.add(new CategoryPath("published", b.getPublished()));

            CategoryDocumentBuilder categoryDocBuilder = new CategoryDocumentBuilder(taxoWriter);

            categoryDocBuilder.setCategoryPaths(categories);

            categoryDocBuilder.build(doc);

            writer.addDocument(doc);

        }

    }

}

/**
 * Immutable value holder describing a single book used by the demo.
 * All four attributes are kept as plain strings and exposed through getters.
 */
class Book {

    private final String title;
    private final String author;
    private final String published;
    private final String category;

    /**
     * Creates a book.
     *
     * @param title     title of the book
     * @param author    name of the author
     * @param published publication value, stored as given
     * @param category  category of the book
     */
    public Book(String title, String author, String published, String category) {
        this.title = title;
        this.author = author;
        this.published = published;
        this.category = category;
    }

    /** @return the title passed to the constructor */
    public String getTitle() {
        return this.title;
    }

    /** @return the author passed to the constructor */
    public String getAuthor() {
        return this.author;
    }

    /** @return the publication value passed to the constructor */
    public String getPublished() {
        return this.published;
    }

    /** @return the category passed to the constructor */
    public String getCategory() {
        return this.category;
    }

}

Result

Search for books with the category:Novel returned : 3 results

---------------------------------

Matching author:

------------------------------------

    Mark Twain: 2

    Some author: 1

    Franz Kafka: 1

Matching category:

------------------------------------

    Novel: 4

Matching published:

------------------------------------

    1901: 2

    1850: 1

    1840: 1

lucene 4.0 - Facet demo的更多相关文章

Lucene 4.3 - Facet demo
package com.fox.facet; import java.io.IOException; import java.util.ArrayList; import java.util.List ...
Lucene 4.8 - Facet Demo
package com.fox.facet; /* * Licensed to the Apache Software Foundation (ASF) under one or more * con ...
lucene搜索之facet查询原理和facet查询实例——TODO
转自:http://www.lai18.com/content/7084969.html Facet说明我们在浏览网站的时候,经常会遇到按某一类条件查询的情况,这种情况尤以电商网站最多,以天猫商城为 ...
关于Lucene 3.0升级到Lucene 4.x 备忘
最近,需要对项目进行lucene版本升级.而原来项目时基于lucene 3.0的,很古老的一个版本的了.在老版本中中,我们主要用了几个lucene的东西: 1.查询lucene多目录索引. 2.构建R ...
Lucene 6.0下使用IK分词器
Lucene 6.0使用IK分词器需要修改修改IKAnalyzer和IKTokenizer. 使用时先新建一个MyIKTokenizer类,一个MyIkAnalyzer类: MyIKTokenizer ...
Lucene 4.0 正式版发布，亮点特性中文解读[转]
http://blog.csdn.net/accesine960/article/details/8066877 2012年10月12日,Lucene 4.0正式发布了(点击这里下载最新版),这个版本 ...
Android5.0(Lollipop) BLE蓝牙4.0+浅析demo连接（三）
作者:Bgwan链接:https://zhuanlan.zhihu.com/p/23363591来源:知乎著作权归作者所有.商业转载请联系作者获得授权,非商业转载请注明出处. Android5.0(L ...
vue入门 0 小demo (挂载点、模板、实例)
vue入门 0 小demo (挂载点.模板) 用直接的引用vue.js 首先讲几个基本的概念 1.挂载点即el:vue 实例化时元素挂靠的地方. 2.模板即template:vue 实例化时挂 ...
Lucene 6.5.0 入门Demo
Lucene 6.5.0 要求jdk 1.8 1.目录结构: 2.数据库环境: private int id; private String name; private float price; pr ...

随机推荐

Gym - 101981M：（南京） Mediocre String Problem（回文树+exkmp）
#include<bits/stdc++.h> #define ll long long #define rep(i,a,b) for(int i=a;i<=b;i++) using ...
Codeforces 520B：Two Buttons（思维，好题）
题目链接:http://codeforces.com/problemset/problem/520/B 题意给出两个数n和m,n每次只能进行乘2或者减1的操作,问n至少经过多少次变换后能变成m 思路 ...
php基础-4
require和include require和include都是导入外部php文件的方法,使用方法为require和include关键字后接导入包(php_file)的名字的字符串形式. 当导入的包 ...
[动态差分+二维前缀和][小a的轰炸游戏]
链接:https://ac.nowcoder.com/acm/contest/317/E来源:牛客网题目描述小a正在玩一款即时战略游戏,现在他要用航空母舰对敌方阵地进行轰炸地方阵地可以看做是n× ...
hasura graphql-engine v1.0.0-alpha30 版本新功能介绍
hasura graphql-engine v1.0.0-alpha30 发布了,以下为一些变动的简单说明破坏性的变动 order_by 中的desc 从 desc nulls last 修改为 d ...
数据格式转换（一）PDF转换技术
PDF(Portable Document Format)文件格式是Adobe公司开发的电子文件格式. 这样的文件格式与操作系统平台无关.这一特点使它成为在Internet上进行电子文档发行 ...
Debug outlook add-in (office.js) 小技巧
这几天在使用office.js 做outlook add-in的时候出现了一个问题: 不知道运行时去调试. 这里给大家介绍两个调试add-in 的方法. office365 其他软件 add-ins ...
java 实现websocket的三种方式
Java中实现websocket常见有以下三种方式: 使用tomcat的websocket实现,需要tomcat 7.x,JEE7的支持. 使用spring的websocket,spring与webs ...
flume简介
组件介绍: 代理 Flume Agent Flume内部有一个或者多个Agent 每一个Agent是一个独立的守护进程(JVM) 从客户端哪儿接收收集,或者从其他的Agent哪儿接收,然后迅速的将获取 ...
全文检索Solr集成HanLP中文分词
以前发布过HanLP的Lucene插件,后来很多人跟我说其实Solr更流行(反正我是觉得既然Solr是Lucene的子项目,那么稍微改改配置就能支持Solr),于是就抽空做了个Solr插件出来,开源在 ...

lucene 4.0 - Facet demo

lucene 4.0 - Facet demo的更多相关文章

随机推荐

热门专题