lucene：索引 -不分词

程序员文章站 2022-07-09 09:53:08

...

package com.capinfotech.faq.classifier;
import java.util.*;
import java.io.File;
import java.io.IOException;

import org.apache.lucene.document.Field;
import org.apache.lucene.document.Field.Index;
import org.apache.lucene.document.Document;
import org.apache.lucene.index.CorruptIndexException;
import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.IndexWriterConfig;
import org.apache.lucene.index.Term;
import org.apache.lucene.queryParser.QueryParser;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.ScoreDoc;
import org.apache.lucene.search.TermQuery;
import org.apache.lucene.store.FSDirectory;
import org.apache.lucene.store.LockObtainFailedException;
import org.apache.lucene.util.Version;
import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.standard.StandardAnalyzer;

import com.capinfotech.faq.data.Query;
import com.sun.org.apache.xerces.internal.impl.xpath.regex.ParseException;
public class luceneindex {
    
	 private static String dest_path="E:/gongzuo/FAQdata/kb/kuaiindex";
     static protected String[] keywords={"4001"};
     static protected String[] contents={"在吗","在不在","有人吗","在线","在没","在线吗","有不有人"," 有人没"," 有人不 在？"};

	public static void main(String[] args) throws IOException {
		// TODO Auto-generated method stub
//		File file=new File(dest_path);
//	    FSDirectory directory=FSDirectory.open(file);
//		Analyzer textanalyzer=new StandardAnalyzer(Version.LUCENE_36);
//		IndexWriterConfig cfg = new IndexWriterConfig(Version.LUCENE_36, textanalyzer);	
//		IndexWriter indexa=new IndexWriter(directory,cfg);
//	for(int i=0;i<9;i++){
//			Document doc=new Document();
//			Field fieldnum=new Field("id",keywords[0],Field.Store.YES,Field.Index.NOT_ANALYZED);
//			doc.add(fieldnum);
//			Field fieldcontent=new Field("content",contents[i],Field.Store.YES,Field.Index.NOT_ANALYZED);
//			doc.add(fieldcontent);
//			indexa.addDocument(doc);
//	}
//		//indexa.optimize();
//		indexa.close();
	
	
	
		luceneindex querytest=new luceneindex();
		querytest.TemqueryTest();
	}
  public  void TemqueryTest() throws IOException{
	//    File file=new File("E:/gongzuo/FAQdata/kb/kuaiindex");
	  File file=new File(dest_path);
	    FSDirectory directory=FSDirectory.open(file);
		  IndexReader reader=IndexReader.open(directory);
		  IndexSearcher search=new IndexSearcher(reader);
//		  Analyzer textanalyzer=new StandardAnalyzer(Version.LUCENE_36);
//		 QueryParser parser=new QueryParser(Version.LUCENE_36,"content",textanalyzer);
//	     Query query=parser.parse("在");
		  Term t =new Term("content","有人");
		  TermQuery query=new TermQuery(t);
		//  ScoreDoc[] docs=search.search(query,10).scoreDocs;
		  ScoreDoc[] docs=search.search(query,12).scoreDocs;
		for(int i=0;i<docs.length;i++){   	
	
			  String querycontent=search.doc(docs[i].doc).get("content");
			  String queryid=search.doc(docs[i].doc).get("id");
			  System.out.println("查询id: "+queryid+"\t查询内容: "+querycontent);
			  System.out.println(docs[i].score);
			  
		}
		  search.close();
  }

}

以上是建立索引以及查询索引的简单例子，当不分词时，检索关键字根据完全匹配搜索

上一篇： lucene 查询+分页+排序

下一篇： Lucene之分页查询的三种方式-yellowcong

lucene：索引 -不分词

以上是建立索引以及查询索引的简单例子，当不分词时，检索关键字根据完全匹配搜索

C#编写了一个基于Lucene.Net的搜索引擎查询通用工具类：SearchEngineUtil

SEO实例经验分享搜索引擎分词和长尾

Net Core使用Lucene.Net和盘古分词器实现全文检索

Lucene-分词器简介及IK分词器的使用

如何优雅的使用参数 is null而不导致全表扫描(破坏索引)

Elasticsearch (1) - 索引库文档分词

Oracle优化——LIKE与索引（以%开头的LIKE会不走索引或走索引全扫描）

lucene索引创建的理解思路

Lucene4.3搜索引擎开发之路分享

搜索引擎的分词技术的简单测试

lucene：索引 -不分词

以上是建立索引以及查询索引的简单例子，当不分词时，检索关键字根据完全匹配搜索

C#编写了一个基于Lucene.Net的搜索引擎查询通用工具类：SearchEngineUtil

SEO实例经验分享 搜索引擎分词和长尾

Net Core使用Lucene.Net和盘古分词器 实现全文检索

Lucene-分词器简介及IK分词器的使用

如何优雅的使用 参数 is null而不导致全表扫描(破坏索引)

Elasticsearch (1) - 索引库 文档 分词

Oracle优化——LIKE与索引（以%开头的LIKE会不走索引或走索引全扫描）

lucene索引创建的理解思路

Lucene4.3搜索引擎开发之路分享

搜索引擎的分词技术的简单测试

SEO实例经验分享搜索引擎分词和长尾

Net Core使用Lucene.Net和盘古分词器实现全文检索

如何优雅的使用参数 is null而不导致全表扫描(破坏索引)

Elasticsearch (1) - 索引库文档分词