Lucene4.7.2 搜尋與高亮顯示

阿新 • • 發佈：2019-01-29

pom.xml

<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
  <modelVersion>4.0.0</modelVersion>
  <groupId>cn.et</groupId>
  <artifactId>LuceneScoreSearch</artifactId>
  <version>0.0.1-SNAPSHOT</version>
  <!-- Spring Boot parent: supplies dependency and plugin version management -->
  <parent>
    <groupId>org.springframework.boot</groupId>
    <artifactId>spring-boot-starter-parent</artifactId>
    <version>1.5.9.RELEASE</version>
  </parent>
  <dependencies>
    <!-- Spring MVC + embedded servlet container for the REST endpoints -->
    <dependency>
      <groupId>org.springframework.boot</groupId>
      <artifactId>spring-boot-starter-web</artifactId>
    </dependency>
    <!-- IK Analyzer: Chinese word segmentation for Lucene -->
    <dependency>
      <groupId>com.janeluo</groupId>
      <artifactId>ikanalyzer</artifactId>
      <version>2012_u6</version>
    </dependency>
    <!-- Lucene highlighter module (groupId must not contain surrounding whitespace) -->
    <dependency>
      <groupId>org.apache.lucene</groupId>
      <artifactId>lucene-highlighter</artifactId>
      <version>4.7.2</version>
    </dependency>
    <!-- JUnit: unit-testing framework for Java -->
    <dependency>
      <groupId>junit</groupId>
      <artifactId>junit</artifactId>
      <version>4.12</version>
      <scope>test</scope>
    </dependency>
  </dependencies>
  <build>
    <plugins>
      <!-- Compile as Java 7 with UTF-8 sources (the code contains Chinese string literals) -->
      <plugin>
        <groupId>org.apache.maven.plugins</groupId>
        <artifactId>maven-compiler-plugin</artifactId>
        <configuration>
          <source>1.7</source>
          <target>1.7</target>
          <encoding>UTF-8</encoding>
        </configuration>
      </plugin>
    </plugins>
  </build>
</project>

<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
  <modelVersion>4.0.0</modelVersion>
  <groupId>cn.et</groupId>
  <artifactId>LuceneScoreSearch</artifactId>
  <version>0.0.1-SNAPSHOT</version>
  <!-- Spring Boot parent: supplies dependency and plugin version management -->
  <parent>
    <groupId>org.springframework.boot</groupId>
    <artifactId>spring-boot-starter-parent</artifactId>
    <version>1.5.9.RELEASE</version>
  </parent>
  <dependencies>
    <!-- Spring MVC + embedded servlet container for the REST endpoints -->
    <dependency>
      <groupId>org.springframework.boot</groupId>
      <artifactId>spring-boot-starter-web</artifactId>
    </dependency>
    <!-- IK Analyzer: Chinese word segmentation for Lucene -->
    <dependency>
      <groupId>com.janeluo</groupId>
      <artifactId>ikanalyzer</artifactId>
      <version>2012_u6</version>
    </dependency>
    <!-- Lucene highlighter module (groupId must not contain surrounding whitespace) -->
    <dependency>
      <groupId>org.apache.lucene</groupId>
      <artifactId>lucene-highlighter</artifactId>
      <version>4.7.2</version>
    </dependency>
    <!-- JUnit: unit-testing framework for Java -->
    <dependency>
      <groupId>junit</groupId>
      <artifactId>junit</artifactId>
      <version>4.12</version>
      <scope>test</scope>
    </dependency>
  </dependencies>
  <build>
    <plugins>
      <!-- Compile as Java 7 with UTF-8 sources (the code contains Chinese string literals) -->
      <plugin>
        <groupId>org.apache.maven.plugins</groupId>
        <artifactId>maven-compiler-plugin</artifactId>
        <configuration>
          <source>1.7</source>
          <target>1.7</target>
          <encoding>UTF-8</encoding>
        </configuration>
      </plugin>
    </plugins>
  </build>
</project>

package cn.et;

import java.io.File;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;

import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.TokenStream;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.document.TextField;
import org.apache.lucene.index.DirectoryReader;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.IndexWriterConfig;
import org.apache.lucene.queryparser.classic.QueryParser;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.ScoreDoc;
import org.apache.lucene.search.TopDocs;
import org.apache.lucene.search.highlight.Fragmenter;
import org.apache.lucene.search.highlight.Highlighter;
import org.apache.lucene.search.highlight.QueryScorer;
import org.apache.lucene.search.highlight.SimpleHTMLFormatter;
import org.apache.lucene.search.highlight.SimpleSpanFragmenter;
import org.apache.lucene.search.highlight.TextFragment;
import org.apache.lucene.search.highlight.TokenSources;
import org.apache.lucene.store.Directory;
import org.apache.lucene.store.FSDirectory;
import org.apache.lucene.util.Version;
import org.junit.Test;
import org.springframework.web.bind.annotation.RequestMapping;
import org.springframework.web.bind.annotation.RestController;
import org.wltea.analyzer.lucene.IKAnalyzer;
@RestController
public class LueneTesting {
	//建立IKAnalyzer分詞器
	static Analyzer analyzer = new IKAnalyzer();
	//建立索引，寫入檔案
	public static void write() throws Exception { 
		//索引存放目錄
		Directory directory = FSDirectory.open(new File("H:/Lucene/index"));
		//Lucene分詞器配置
		IndexWriterConfig config = new IndexWriterConfig(Version.LUCENE_47, analyzer);
		IndexWriter iwriter = new IndexWriter(directory, config);
		//建立文件物件，相當於資料庫中的每條記錄(MongoDB、Oracle、MySQL...)，注意：物件簡述純屬虛構，不帶任何攻擊惡意
		Document doc0 = new Document();
		Field doc0field1 = new Field("AGE","20",TextField.TYPE_STORED);
		Field doc0field2 = new Field("NAME","路橙",TextField.TYPE_STORED);
		Field doc0field3 = new Field("BRIEF","來自中國湖南永州，是一名初級Java開發工程師，中國網際網路技術部落格：http://blog.csdn.net/phone13144830339",TextField.TYPE_STORED);
		doc0.add(doc0field1);
		doc0.add(doc0field2);
		doc0.add(doc0field3);
		Document doc1 = new Document();
		Field doc1field1 = new Field("AGE","21",TextField.TYPE_STORED);
		Field doc1field2 = new Field("NAME","謝飛",TextField.TYPE_STORED);
		Field doc1field3 = new Field("BRIEF","來自中國湖北武漢，是一名語文老師，中國教育網成員，2010年評選為中國10大優秀教師",TextField.TYPE_STORED);
		doc1.add(doc1field1);
		doc1.add(doc1field2);
		doc1.add(doc1field3);
		Document doc2 = new Document();
		Field doc2field1 = new Field("AGE","22",TextField.TYPE_STORED);
		Field doc2field2 = new Field("NAME","鄧娟",TextField.TYPE_STORED);
		Field doc2field3 = new Field("BRIEF","來自中國四川綿陽，是一名幼兒園老師",TextField.TYPE_STORED);
		doc2.add(doc2field1);
		doc2.add(doc2field2);
		doc2.add(doc2field3);
		Document doc3 = new Document();
		Field doc3field1 = new Field("AGE","23",TextField.TYPE_STORED);
		Field doc3field2 = new Field("NAME","曹焰斌",TextField.TYPE_STORED);
		Field doc3field3 = new Field("BRIEF","來自中國廣東廣州，是一名建築工人",TextField.TYPE_STORED);
		doc3.add(doc3field1);
		doc3.add(doc3field2);
		doc3.add(doc3field3);
		Document doc4 = new Document();
		Field doc4field1 = new Field("AGE","24",TextField.TYPE_STORED);
		Field doc4field2 = new Field("NAME","SMISI",TextField.TYPE_STORED);
		Field doc4field3 = new Field("BRIEF","來自美國底特律，是一名外資企業經理",TextField.TYPE_STORED);
		doc4.add(doc4field1);
		doc4.add(doc4field2);
		doc4.add(doc4field3);
		iwriter.addDocument(doc0);
		iwriter.addDocument(doc1);
		iwriter.addDocument(doc2);
		iwriter.addDocument(doc3);
		iwriter.addDocument(doc4);
		iwriter.commit();
		iwriter.close();
	}
	//查詢索引，檢視得分情況
	@RequestMapping("/simpleSearchScore") 
	public static String simpleSearch() throws Exception {
		String content = "中國";
		Directory directory = FSDirectory.open(new File("H:/Lucene/index"));
		//指定索引查詢目錄
		DirectoryReader ireader = DirectoryReader.open(directory);
		IndexSearcher isearcher = new IndexSearcher(ireader);
		//指定查詢的field名和使用的分詞解析器
		QueryParser parser = new QueryParser(Version.LUCENE_47,"BRIEF",analyzer);
		Query query = parser.parse(content);
		//搜尋得分排序的陣列，文字中包含收搜內容的數量
		
	    String resultStr = "";
	    TopDocs docs = isearcher.search(query, 10);
	    for (ScoreDoc doc : docs.scoreDocs) {
	     String str = 
	    		 "文件ID: " + doc.doc 
	    		 + "<br/>BRIEF："+isearcher.doc(doc.doc).get("BRIEF")
	    		 + "<br/>NAME："+isearcher.doc(doc.doc).get("NAME")
	    		 +"<br/>AGE："+isearcher.doc(doc.doc).get("AGE")
	    		 + "<br/>得分情況: " + doc.score
	     		 + "<hr border='5px' color='red'/>";
	     resultStr += str;
	    }
	    return resultStr;
	}
	
	//查詢索引，收搜文件物件,頁面高亮顯示
	@RequestMapping("/highlighterSearch")
    public List<Map<String,String>> highlighterTesting() throws Exception{
		String content = "中國";
		Directory directory = FSDirectory.open(new File("H:/Lucene/index"));
		//指定索引查詢目錄
		DirectoryReader ireader = DirectoryReader.open(directory);
		IndexSearcher searcher = new IndexSearcher(ireader);
		QueryParser parser = new QueryParser(Version.LUCENE_47,"BRIEF",analyzer);
		
		Query query = parser.parse(content);
		TopDocs hits = searcher.search(query, 10);
		SimpleHTMLFormatter htmlFormatter = new SimpleHTMLFormatter("<font color=red>","</font>");
		Highlighter highlighter = new Highlighter(htmlFormatter, new QueryScorer(query));
		//設定高亮處理的字元個數
		highlighter.setMaxDocCharsToAnalyze(20);
		List<Map<String,String>> list = new ArrayList<Map<String,String>>();
		int item = hits.scoreDocs.length;
		System.out.println(item);
		for (int i = 0; i < item; i++) {
			System.out.println(i);
		    int id = hits.scoreDocs[i].doc;
		    Document doc = searcher.doc(id);
		    
		    Map<String,String> map = new HashMap<String,String>();
		    map.put("name",doc.get("NAME"));
		    
		    String text = doc.get("BRIEF");
		    TokenStream tokenStream = TokenSources.getAnyTokenStream(searcher.getIndexReader(), id, "BRIEF", analyzer);
		    TextFragment[] frag = highlighter.getBestTextFragments(tokenStream, text, false, 10);
		    System.out.println(frag.length);
		    for (int j = 0; j < frag.length; j++) {
		    	System.out.println(frag[j]);
                if((frag[j] != null) && (frag[j].getScore() > 0)) {
			        String str = frag[j].toString();
			        System.out.println(str);
			        map.put("brief",str);
			    }
		    }
		    
		    map.put("age",doc.get("AGE"));
		    list.add(map);
		}
		
		return list;
	}
}

package cn.et;

import org.springframework.boot.SpringApplication;
import org.springframework.boot.autoconfigure.SpringBootApplication;

/**
 * Spring Boot entry point for the Lucene search demo.
 */
@SpringBootApplication
public class SpringBootMain {
    /**
     * Boots the Spring application using this class as the configuration source.
     *
     * @param args command-line arguments, handed to Spring Boot unchanged
     */
    public static void main(String[] args) {
        SpringApplication application = new SpringApplication(SpringBootMain.class);
        application.run(args);
    }
}

Lucene4.7.2 搜尋與高亮顯示

pom.xml <project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="

elasticsearch5.5.2用javaAPI實現搜尋結果高亮顯示和搜尋建議

前言：像百度、360搜尋等等，我們輸入完搜尋條件時，他會自動出來一個提示框，將我們輸入的關鍵詞進行自動補全，即搜尋推薦。當我們點選搜尋後，返回的搜尋結果中會將我們搜尋的內容進行高亮的顯示（不同顏色標記出來），強大的elasticsearch就提供了這些功能。在這裡我會使用ja

jQuery實現搜尋內容高亮顯示

<html> <head> <meta charset="UTF-8"> <title>jQuery搜尋高亮顯示</title>

搜尋關鍵字高亮顯示方法

{ //sqlstr 待查詢的關鍵字 //str 已經查詢到帶有關鍵字的字串 int len=sqlkey.Length; int len1=str.Length;

VUE：vue 搜尋結果高亮顯示關鍵字（父+子）

1. 需要解決的問題父元件將搜尋的欄位傳到子元件子元件接受資料，正則匹配，並替換欄位 2. 具體程式碼父元件程式碼 <template> <div> <div v-if="showMe"> <

使用textSearch.js實現關鍵詞搜尋，並搜尋結果高亮顯示

引用塊內容今天我們介紹的這個外掛來自http://www.zhangxinxu.com/wordpress/，張鑫旭的文章寫得挺好的，大家有興趣的多看看。我們今天的這個外掛叫“jq

WPF搜尋關鍵字高亮顯示

目標：在WPF中，對lucene.net進行全文檢索後的結果中包含的關鍵字進行高亮顯示。檢索結果中的關鍵字高亮顯示，在網頁中顯示是很簡單的，lucene中加標籤樣式就可以了，可是在WPF中就不行了。我在WPF中用GridControl顯示搜尋結果列表，GridContr

全文檢索Lucene（三）--中文分詞與高亮顯示

一、中文分詞smartcn 二、檢索結果高亮顯示實現首先，建立maven專案，新增相關依賴。<dependencies> <dependency> <groupId>org.apache.lucene</g

一步一步跟我學習lucene（11）---lucene搜尋之高亮顯示highlighter

highlighter介紹這幾天一直加班，部落格有三天沒有更新了，望見諒；我們在做查詢的時候，希望對我們自己的搜尋結果與搜尋內容相近的地方進行著重顯示，就如下面的效果這裡我們搜尋的內容是“一步一步跟我學習lucene”，搜尋引擎展示的結果中對使用者的輸入資訊進行了配色方

sublime text3生成網頁標頭檔案與高亮顯示

先說高亮顯示問題，因為一開始我寫這些HTML程式碼時全都是同一個灰色，就感覺不對勁，和別人的顏色不一樣，最後找到了原因：sublime會根據檔案字尾名進行高亮顯示，而這個時候你還沒有進行儲存，檔案是沒有後綴名的。如果想實現高亮顯示，可以在軟體右下角選擇Pl

zTree實現模糊搜尋並高亮顯示

zTree是一個常用的樹外掛，本身對搜尋功能封裝的不是太完美，為了實現下列效果我對其進行了二次封裝。首先，在定義tree時我們將它高亮和普通顯示的樣式定義好。 var setting = { view:

實現DataTables搜尋框查詢結果高亮顯示

DataTables是封裝好的HTML表格外掛，豐富了HTML表格的樣式，提供了即時搜尋、分頁等多種表格高階功能。使用者可以編寫很少的程式碼（甚至只是使用官方的示例程式碼），做出一個漂亮的表格以展示資料。關於DataTables的更多資訊，請檢視：http://www.datatables.club/、htt

Springboot+AngularJS+Spring-data-Solr：搜尋內容匹配高亮顯示

Java後臺部分： package com.phubing.search.service.impl; import java.util.HashMap; import java.util.List; import java.util.Map; import org.springframe

Solr實現商城搜尋高亮顯示

package com.pinyougou.search.service.impl; import java.util.ArrayList; import java.util.HashMap; import java.util.List; import java.util.Map; im

基於Vue實現關鍵詞實時搜尋高亮顯示關鍵詞

最近在做移動端 real-time-search（實時搜尋）和關鍵詞高亮顯示的功能，通過部落格的方式總結一下，同時希望能夠幫助到別人~~~ 好了，閒話不多說，直接上程式碼。實時搜尋：實時搜尋通過觸發input事件和定時器來實現 <input v-model="keyW

分散式搜尋elasticsearch java API 之 highlighting （對搜尋結果的高亮顯示）

搜尋請求的Body如下:： { "query" : {...}, "highlight" : { "fields" : { "title":{}, "intro" : {}

js 搜尋關鍵字，文章中關鍵字高亮顯示

實現程式碼如下： <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/2000/REC-xhtml1-20000126/DTD/xhtml1-tran

搜尋完後，讓搜尋後的關鍵字高亮顯示

繫結的時候,比如你的資料來源是datatableif(keyword.Text != "" && keyword.Text != null ){for(int iloop =0 ;iloop < dstemp.Tables[0].Rows.Count ;

Table的row-class-name無效與動態高亮顯示選中行背景色

Element UI 的Table元件踩坑記：（1）引數row-class-name無效的坑：官方文件給出了如下程式碼：但是我使用後並沒有出現預期想要第一行高亮的效果，然後console.l

Linux下搜尋指定目錄下檔案中特定字串並高亮顯示匹配關鍵詞

find ./ -name "*" | xargs grep --color=auto "mysql" 這是查詢當前目錄下所有檔案中包含mysql字串的檔案，並且高亮顯示mysql關鍵詞。而auto則只在輸出到終端時才加上顏色。可以在.bashrc里加上： export

Lucene4.7.2 搜尋與高亮顯示

相關推薦