Lucene的其他搜索(三)

生成索引：

package com.wp.search;

import java.nio.file.Paths;

import org.apache.lucene.analysis.Analyzer;

import org.apache.lucene.analysis.standard.StandardAnalyzer;

import org.apache.lucene.document.Document;

import org.apache.lucene.document.Field;

import org.apache.lucene.document.IntField;

import org.apache.lucene.document.StringField;

import org.apache.lucene.document.TextField;

import org.apache.lucene.index.IndexWriter;

import org.apache.lucene.index.IndexWriterConfig;

import org.apache.lucene.store.Directory;

import org.apache.lucene.store.FSDirectory;

/**
 * Builds a small demo Lucene index of three city documents, each with an
 * {@code id}, a {@code city} and a {@code desc} field.
 */
public class Indexer {

    // Sample data: the i-th element of each array belongs to the i-th document.
    private Integer ids[] = { 1, 2, 3 };

    private String citys[] = { "aingdao", "banjing", "changhai" };

    // The last description ("Shanghai is d dustling dity.") deliberately
    // contains no "b" or "c" words, in preparation for the range-search demo.
    private String descs[] = { "Qingdao is b beautiful city.",
            "Nanjing is c city of culture.", "Shanghai is d dustling dity." };

    // Directory the index is written to; assigned by index(String).
    private Directory dir;

    /**
     * Creates an IndexWriter on {@link #dir} configured with a StandardAnalyzer.
     *
     * @return a new writer; the caller is responsible for closing it
     * @throws Exception if the writer cannot be created
     */
    private IndexWriter getWriter() throws Exception {
        Analyzer analyzer = new StandardAnalyzer(); // standard tokenizer/analyzer
        IndexWriterConfig iwc = new IndexWriterConfig(analyzer); // attach the analyzer to the index config
        return new IndexWriter(dir, iwc);
    }

    /**
     * Writes one document per sample entry into the index at {@code indexDir}.
     *
     * @param indexDir file-system path of the index directory
     * @throws Exception if the directory cannot be opened or a document cannot be written
     */
    private void index(String indexDir) throws Exception {
        dir = FSDirectory.open(Paths.get(indexDir));
        // try-with-resources closes the writer even when addDocument throws;
        // the directory is closed afterwards in the finally block.
        try (IndexWriter writer = getWriter()) {
            for (int i = 0; i < ids.length; i++) {
                Document doc = new Document();
                doc.add(new IntField("id", ids[i], Field.Store.YES));
                doc.add(new StringField("city", citys[i], Field.Store.YES));
                doc.add(new TextField("desc", descs[i], Field.Store.YES));
                writer.addDocument(doc); // add the document to the index
            }
        } finally {
            dir.close();
        }
    }

    public static void main(String[] args) throws Exception {
        new Indexer().index("D:\\lucene\\luceneIndex");
    }

}

其他搜索:

package com.wp.search;

import java.nio.file.Paths;

import org.apache.lucene.document.Document;

import org.apache.lucene.index.DirectoryReader;

import org.apache.lucene.index.IndexReader;

import org.apache.lucene.index.Term;

import org.apache.lucene.search.BooleanClause;

import org.apache.lucene.search.BooleanQuery;

import org.apache.lucene.search.IndexSearcher;

import org.apache.lucene.search.NumericRangeQuery;

import org.apache.lucene.search.PrefixQuery;

import org.apache.lucene.search.ScoreDoc;

import org.apache.lucene.search.TermRangeQuery;

import org.apache.lucene.search.TopDocs;

import org.apache.lucene.store.Directory;

import org.apache.lucene.store.FSDirectory;

import org.apache.lucene.util.BytesRef;

import org.junit.After;

import org.junit.Before;

import org.junit.Test;

/**
 * JUnit demos of several Lucene query types (term range, numeric range,
 * prefix and boolean) run against the index at {@code D:\lucene\luceneIndex}.
 */
public class SearchTest {

    private Directory dir;

    private IndexReader reader;

    private IndexSearcher is;

    /**
     * Opens the index directory and creates a searcher over it.
     *
     * @throws Exception if the index cannot be opened
     */
    @Before
    public void setUp() throws Exception {
        dir = FSDirectory.open(Paths.get("D:\\lucene\\luceneIndex")); // FSDirectory: file-system backed index directory
        reader = DirectoryReader.open(dir);
        is = new IndexSearcher(reader);
    }

    /**
     * Closes the reader and then the directory. Either may still be null if
     * setUp failed part-way, so both are guarded.
     *
     * @throws Exception if closing fails
     */
    @After
    public void tearDown() throws Exception {
        try {
            if (reader != null) {
                reader.close();
            }
        } finally {
            if (dir != null) {
                dir.close();
            }
        }
    }

    /**
     * Term range search on the {@code desc} field between "b" and "c", both
     * bounds inclusive. The "Shanghai is d dustling dity." description was
     * written without any b/c words so the effect is easy to see in the output.
     *
     * @throws Exception if the search fails
     */
    @Test
    public void testTermRangeQuery() throws Exception {
        // newStringRange encodes the bounds itself, avoiding the
        // platform-default charset used by String.getBytes().
        TermRangeQuery query = TermRangeQuery.newStringRange("desc", "b", "c",
                true, true);
        TopDocs hits = is.search(query, 10); // top 10 hits
        printHits(hits);
    }

    /**
     * Numeric range search: {@code id} between 1 and 3, both bounds inclusive.
     *
     * @throws Exception if the search fails
     */
    @Test
    public void testNumericRangeQuery() throws Exception {
        NumericRangeQuery<Integer> query = NumericRangeQuery.newIntRange("id",
                1, 3, true, true);
        TopDocs hits = is.search(query, 10);
        printHits(hits);
    }

    /**
     * Prefix search: {@code city} values starting with "a".
     *
     * @throws Exception if the search fails
     */
    @Test
    public void testPrefixQuery() throws Exception {
        PrefixQuery query = new PrefixQuery(new Term("city", "a"));
        TopDocs hits = is.search(query, 10);
        printHits(hits);
    }

    /**
     * Multi-condition search: {@code id} in [1, 2] AND {@code city} starting
     * with "a".
     *
     * @throws Exception if the search fails
     */
    @Test
    public void testBooleanQuery() throws Exception {
        NumericRangeQuery<Integer> query1 = NumericRangeQuery.newIntRange("id",
                1, 2, true, true); // id between 1 and 2
        PrefixQuery query2 = new PrefixQuery(new Term("city", "a")); // city starts with "a"

        BooleanQuery.Builder booleanQuery = new BooleanQuery.Builder();
        // Occur.MUST means "and". Alternatives to try for query1:
        // Occur.MUST_NOT ("except") or Occur.SHOULD ("or").
        booleanQuery.add(query1, BooleanClause.Occur.MUST);
        booleanQuery.add(query2, BooleanClause.Occur.MUST);

        TopDocs hits = is.search(booleanQuery.build(), 10);
        printHits(hits);
    }

    /**
     * Prints the stored id, city and desc fields of every hit, one per line.
     *
     * @param hits search result to print
     * @throws Exception if a matching document cannot be loaded
     */
    private void printHits(TopDocs hits) throws Exception {
        for (ScoreDoc scoreDoc : hits.scoreDocs) {
            Document doc = is.doc(scoreDoc.doc); // load the stored fields of the hit
            System.out.println(doc.get("id"));
            System.out.println(doc.get("city"));
            System.out.println(doc.get("desc"));
        }
    }

}

Lucene的其他搜索(三)的更多相关文章

Apache Solr采用Java开发、基于Lucene的全文搜索服务器
http://docs.spring.io/spring-data/solr/ 首先介绍一下solr: Apache Solr (读音: SOLer) 是一个开源.高性能.采用Java开发.基于Luc ...
基于 Lucene 的桌面文件搜索
开源2010年,自己在学习 Lucene 时开发的一款桌面文件搜索工具,这么多年过去了,代码一直静静存放在自己的硬盘上,与其让其沉睡,不如分享出来. 这款工具带有明显的模仿 Everything 的痕 ...
Apache Lucene(全文检索引擎)—搜索
目录返回目录:http://www.cnblogs.com/hanyinglong/p/5464604.html 本项目Demo已上传GitHub,欢迎大家fork下载学习:https://gith ...
lucene学习笔记：三，Lucene的索引文件格式
Lucene的索引里面存了些什么,如何存放的,也即Lucene的索引文件格式,是读懂Lucene源代码的一把钥匙. 当我们真正进入到Lucene源代码之中的时候,我们会发现: Lucene的索引过程, ...
lucene的多种搜索2-SpanQuery
SpanQuery按照词在文章中的距离或者查询几个相邻词的查询 SpanQuery包括以下几种: SpanTermQuery:词距查询的基础,结果和TermQuery相似,只不过是增加了查询结果中单词 ...
如何使用 Lucene 做网站高亮搜索功能？
现在基本上所有网站都支持搜索功能,现在搜索的工具有很多,比如Solr.Elasticsearch,它们都是基于 Lucene 实现的,各有各的使用场景.Lucene 比较灵活,中小型项目中使用的比较多 ...
一种安全云存储方案设计（下）——基于Lucene的云端搜索与密文基础上的模糊查询
一种安全的云存储方案设计(未完整理中) 一篇老文了,现在看看错漏颇多,提到的一些技术已经跟不上了.仅对部分内容重新做了一些修正,增加了一些机器学习的内容,然并卵. 这几年来,云产品层出不穷,但其安全性 ...
Lucene建立索引搜索入门实例
第一部分:Lucene建立索引 Lucene建立索引主要有以下两步:第一步:建立索引器第二步:添加索引文件准备在f盘建立lucene文件夹,然后 ...
WebGIS中解决使用Lucene进行兴趣点搜索排序的两种思路
文章版权由作者李晓晖和博客园共有,若转载请于明显处标明出处:http://www.cnblogs.com/naaoveGIS/. 1.背景目前跟信息采集相关的一个项目提出了这样的一个需求:中国银行等 ...

随机推荐

sed命令参数之-r -i
对于初学linux的朋友来说,能记住命令附带的一大帮参数就已经非常不容易了.好不容易把该用的参数都想全了.sed -irns 后面一大片脚本 ,一执行出错了 what!!!! 创建一下测试环境 hea ...
SQL Server 一张图让你秒懂联合表查询
CSS3 flexbox 布局 ---- flex 容器属性介绍
flexbox布局是CSS3中新增的属性,它可以很轻松地帮我们解决掉一些常见的布局问题,比如导航栏. 我们用普通的方法写导航栏,通常会在ul, li 结构写好后,让li 元素左浮动,然后再给ul 清浮 ...
Python介绍及环境配置
Python 简介 Python 是一个高层次的结合了解释性.编译性.互动性和面向对象的脚本语言. Python 的设计具有很强的可读性,相比其他语言经常使用英文关键字,其他语言的一些标点符号,它具有 ...
.net core 2.0 Autofac
参考自 https://github.com/VictorTzeng/Zxw.Framework.NetCore 安装Autofac,在`project.csproj`加入 <PackageRe ...
关于mysql 5.7 版本登录时出现错误 1045的随笔
之前学习的时候用的都是oracle 但是现在在工作中大部分用的都是mysql,所以自己也就装了个mysql,下载.安装教程都是从网上百度的,花了挺长时间才装好,心也是挺累的,教程挺多,就是不知道该用哪 ...
POJ 1017 最少包裹
参考自:https://www.cnblogs.com/ECJTUACM-873284962/p/6414760.html Packets Time Limit: 1000MS Memory Li ...
CentOS安装配置MySQL，redis
MySQL(MariaDB) 一,说明 MariaDB数据库管理系统是MySQL的一个分支,主要由开源社区在维护,采用GPL授权许可.开发这个分支的原因之一是:甲骨文公司收购了MySQL后,有将MyS ...
洛谷P2085最小函数值题解
题目首先我们先分析一下题目范围,\(a,b,c\) 都是整数,因此我们可以得出它的函数值在\((0,+\infty )\)上是单调递增的,,然后我们可以根据函数的性质,将每个函数设置一个当前指向位置 ...
【BZOJ3625】【CF438E】小朋友和二叉树 NTT 生成函数多项式开根多项式求逆
题目大意考虑一个含有\(n\)个互异正整数的序列\(c_1,c_2,\ldots ,c_n\).如果一棵带点权的有根二叉树满足其所有顶点的权值都在集合\(\{c_1,c_2,\ldots ,c_n\ ...

Lucene的其他搜索(三)

Lucene的其他搜索(三)的更多相关文章

随机推荐

热门专题