设为首页 收藏本站
查看: 476|回复: 0

[经验分享] Apache的lucene2.3.2来做索引

[复制链接]

尚未签到

发表于 2017-1-4 09:19:26 | 显示全部楼层 |阅读模式
Apache的lucene2.3.2来做索引

1、导入jar包
在pom.xml中导入
<dependency>
<groupId>org.apache.lucene</groupId>
<artifactId>lucene-analyzers</artifactId>
<version>2.3.2</version>
</dependency>
<dependency>
<groupId>org.apache.lucene</groupId>
<artifactId>lucene-core</artifactId>
<version>2.3.2</version>
</dependency>
<dependency>
<groupId>org.apache.lucene</groupId>
<artifactId>lucene-memory</artifactId>
<version>2.3.2</version>
</dependency>
<dependency>
<groupId>org.apache.lucene</groupId>
<artifactId>lucene-highlighter</artifactId>
<version>2.3.2</version>
</dependency>

2、POJO的基类
对象的基类BaseObject.java,基类中写id,gmtCreate,gmtModify等成员,避免每个类中重复书写
package com.sillycat.easyview.plugin.commons.base;
import java.io.Serializable;
public class BaseObject implements Serializable {
private static final long serialVersionUID = -5588271386305919216L;
private Integer id;
public Integer getId() {
   return id;
}
public void setId(Integer id) {
   this.id = id;
}
}

搜索类的接口,要实现build索引的接口LuceneObject.java :
package com.sillycat.easyview.plugin.commons.base;
import org.apache.lucene.document.Document;
public interface LuceneObject {
public Document buildindex();
}

真正的POJO例子User.java:
package com.sillycat.easyview.core.model;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import com.sillycat.easyview.plugin.commons.base.BaseObject;
import com.sillycat.easyview.plugin.commons.base.LuceneObject;
import com.sillycat.easyview.plugin.commons.utils.StringUtil;
public class User extends BaseObject implements LuceneObject {
private static final long serialVersionUID = -6050058005265846739L;
private String logonName;
private String email;
private String nickName;
private String phone;
private String mobile;
//建立索引
public Document buildindex() {
   Document doc = new Document();
   if (StringUtil.isNotBlank(this.getLogonName())) {
    doc.add(new Field("logonName", this.getLogonName(),
      Field.Store.YES, Field.Index.TOKENIZED));
   }
   if (StringUtil.isNotBlank(this.getEmail())) {
    doc.add(new Field("email", this.getEmail(), Field.Store.YES,
      Field.Index.TOKENIZED));
   }
   return doc;
}
public User() {
}
// getter and setter
}

3、调用lucene创建索引和搜索
lucene工具实现类LuceneManagerImpl.java:
package com.sillycat.easyview.core.service.impl;
import java.io.File;
import java.io.IOException;
import java.util.Iterator;
import java.util.List;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.lucene.analysis.cn.ChineseAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.queryParser.ParseException;
import org.apache.lucene.queryParser.QueryParser;
import org.apache.lucene.search.Hits;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.store.RAMDirectory;

import com.sillycat.easyview.core.service.LuceneManager;
import com.sillycat.easyview.plugin.commons.base.BaseManager;
import com.sillycat.easyview.plugin.commons.base.LuceneObject;
import com.sillycat.easyview.plugin.commons.utils.StringUtil;

public class LuceneManagerImpl extends BaseManager implements LuceneManager {

public static Log log = LogFactory.getLog(LuceneManagerImpl.class);

private RAMDirectory directory = null;

private ChineseAnalyzer analyzer = null;

private static final String INDEX_PATH = "D:\\lucene\\index";

private String indexPath;

public void init() {
   directory = new RAMDirectory();
   analyzer = new ChineseAnalyzer();
}

/**
* 搜索
* @param key     要搜索的KEY,比如找context字段 context
* @param search 要搜索的内容,比如找context中出现了 我爱你
* @param memory true 内存的索引,false 配置的路径的索引
*/
public Hits search(String key, String search,boolean memory) throws IOException,
    ParseException {
   IndexSearcher searcher = null;
   if (memory) {
    searcher = new IndexSearcher(directory);
   } else {
    IndexReader reader = IndexReader.open(this.getIndexPath());
    searcher = new IndexSearcher(reader);
   }
   QueryParser parser = new QueryParser(key, analyzer);
   return searcher.search(parser.parse(search));
}

/**
* 建立索引
* @param list   要建立索引的list
* @param memory    true 内存中建立索引,false 配置的路径上存放索引   
*/
public void buildIndex(List<LuceneObject> list,boolean memory)
    throws IOException {
   IndexWriter writer = null;
   if (memory) {
    writer = new IndexWriter(directory, analyzer, true);
   } else {
    writer = new IndexWriter(new File(this.getIndexPath()), analyzer,
      true);
   }
   Iterator<LuceneObject> iterator = list.iterator();
   Document doc = null;
   LuceneObject bo = null;
   while (iterator.hasNext()) {
    bo = (LuceneObject) iterator.next();
    doc = bo.buildindex();
    writer.addDocument(doc);
   }
   writer.optimize();
   writer.close();
}

public String getIndexPath() {
   if (StringUtil.isBlank(indexPath)) {
    indexPath = INDEX_PATH;
   }
   return indexPath;
}

public void setIndexPath(String indexPath) {
   this.indexPath = indexPath;
}

}

实现类的接口LuceneManager.java
package com.sillycat.easyview.core.service;

import java.io.IOException;
import java.util.List;

import org.apache.lucene.queryParser.ParseException;
import org.apache.lucene.search.Hits;

import com.sillycat.easyview.plugin.commons.base.LuceneObject;

public interface LuceneManager {

public void init();

public Hits search(String key, String search,boolean memory) throws IOException,
    ParseException;

public void buildIndex(List<LuceneObject> list,boolean memory) throws IOException;

}

实现类的配置文件applicationContext-bean.xml:
<bean id="luceneManager"
    class="com.sillycat.easyview.core.service.impl.LuceneManagerImpl" autowire="byName" init-method="init">
    <!-- 在硬盘上存放索引的位置 -->
    <property name="indexPath" value="${lucene.indexPath}"/>
</bean>

配置文件easyview.properties
#lucene configiration
lucene.indexPath=D\:\\lucene\\index

4、单元测试
LuceneManagerTest.java单元测试:
package com.sillycat.easyview.core.service;

import java.util.ArrayList;
import java.util.List;

import org.apache.lucene.document.Document;
import org.apache.lucene.search.Hits;

import com.sillycat.easyview.core.model.User;
import com.sillycat.easyview.plugin.commons.base.ServiceTestBase;

public class LuceneManagerTest extends ServiceTestBase {

private LuceneManager luceneManager;

protected void setUp() throws Exception {
   super.setUp();
   luceneManager = (LuceneManager) appContext.getBean("luceneManager");
}

protected void tearDown() throws Exception {
   super.tearDown();
}

public void testDumy() {
   assertTrue(true);
}

public void testSearch() throws Exception {
   luceneManager.init();
   List list = new ArrayList();
   User t1 = new User();
   t1.setId(Integer.valueOf("1"));
   t1.setLogonName("中文1");
   t1.setEmail("中文1@126.com");
   User t2 = new User();
   t2.setId(Integer.valueOf("2"));
   t2.setLogonName("中英文2");
   t2.setEmail("中英文2@126.com");
   list.add(t1);
   list.add(t2);
   //luceneManager.buildIndex(list,true);
   //Hits results = luceneManager.search("logonName", "中文1",true);
   luceneManager.buildIndex(list,false);
   Hits results = luceneManager.search("logonName", "中文1",false);
   assertEquals(1, results.length());

   Document doc = results.doc(0);
   assertEquals("中文1", doc.getField("logonName").stringValue());
   assertEquals("中文1@126.com", doc.getField("email").stringValue());

   //results = luceneManager.search("logonName", "中",true);
   results = luceneManager.search("logonName", "中",false);
   assertEquals(2, results.length());

}

}

运维网声明 1、欢迎大家加入本站运维交流群:群②:261659950 群⑤:202807635 群⑦870801961 群⑧679858003
2、本站所有主题由该帖子作者发表,该帖子作者与运维网享有帖子相关版权
3、所有作品的著作权均归原作者享有,请您和我们一样尊重他人的著作权等合法权益。如果您对作品感到满意,请购买正版
4、禁止制作、复制、发布和传播具有反动、淫秽、色情、暴力、凶杀等内容的信息,一经发现立即删除。若您因此触犯法律,一切后果自负,我们对此不承担任何责任
5、所有资源均系网友上传或者通过网络收集,我们仅提供一个展示、介绍、观摩学习的平台,我们不对其内容的准确性、可靠性、正当性、安全性、合法性等负责,亦不承担任何法律责任
6、所有作品仅供您个人学习、研究或欣赏,不得用于商业或者其他用途,否则,一切后果均由您自己承担,我们对此不承担任何法律责任
7、如涉及侵犯版权等问题,请您及时通知我们,我们将立即采取措施予以解决
8、联系人Email:admin@iyunv.com 网址:www.yunweiku.com

所有资源均系网友上传或者通过网络收集,我们仅提供一个展示、介绍、观摩学习的平台,我们不对其承担任何法律责任,如涉及侵犯版权等问题,请您及时通知我们,我们将立即处理,联系人Email:kefu@iyunv.com,QQ:1061981298 本贴地址:https://www.yunweiku.com/thread-323592-1-1.html 上篇帖子: Apache Http Server 强大功能(支持ASP) 下篇帖子: Apache+AJP+Tomcat6+Session复制配置
您需要登录后才可以回帖 登录 | 立即注册

本版积分规则

扫码加入运维网微信交流群X

扫码加入运维网微信交流群

扫描二维码加入运维网微信交流群,最新一手资源尽在官方微信交流群!快快加入我们吧...

扫描微信二维码查看详情

客服E-mail:kefu@iyunv.com 客服QQ:1061981298


QQ群⑦:运维网交流群⑦ QQ群⑧:运维网交流群⑧ k8s群:运维网kubernetes交流群


提醒:禁止发布任何违反国家法律、法规的言论与图片等内容;本站内容均来自个人观点与网络等信息,非本站认同之观点.


本站大部分资源是网友从网上搜集分享而来,其版权均归原作者及其网站所有,我们尊重他人的合法权益,如有内容侵犯您的合法权益,请及时与我们联系进行核实删除!



合作伙伴: 青云cloud

快速回复 返回顶部 返回列表