【第三节】Lucene5文档域加权

javazx · 发表于 2016-6-20 14:49:36

1、源码
import java.nio.file.Paths;

import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.document.StringField;
import org.apache.lucene.document.TextField;
import org.apache.lucene.index.DirectoryReader;
import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.IndexWriterConfig;
import org.apache.lucene.index.Term;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.ScoreDoc;
import org.apache.lucene.search.TermQuery;
import org.apache.lucene.search.TopDocs;
import org.apache.lucene.store.Directory;
import org.apache.lucene.store.FSDirectory;
import org.junit.Test;

public class IndexingTest2 {

private String ids[]={"1","2","3","4"};
private String authors[]={"Jack","Marry","John","Json"};
private String positions[]={"accounting","technician","salesperson","boss"};
private String titles[]={"Java is a good language.","Java is a cross platform language","Java powerful","You should learn java"};
private String contents[]={
         "If possible, use the same JRE major version at both index and search time.",
         "When upgrading to a different JRE major version, consider re-indexing. ",
         "Different JRE major versions may implement different versions of Unicode,",
         "For example: with Java 1.4, `LetterTokenizer` will split around the character U+02C6,"
};

private Directory dir;

/**
   * 获取IndexWriter实例
   * @return
   * @throws Exception
   */
private IndexWriter getWriter()throws Exception{
      Analyzer analyzer=new StandardAnalyzer(); // 标准分词器
      IndexWriterConfig iwc=new IndexWriterConfig(analyzer);
      IndexWriter writer=new IndexWriter(dir, iwc);
      return writer;
}

/**
   * 生成索引
   * @throws Exception
   */
@Test
public void index()throws Exception{
      dir=FSDirectory.open(Paths.get("D:\\lucene3"));
      IndexWriter writer=getWriter();
      for(int i=0;i<ids.length;i++){
         Document doc=new Document();
         doc.add(new StringField("id", ids, Field.Store.YES));+ j- V" |; q. T# K: a$ k9 @0 u
         doc.add(new StringField("author",authors,Field.Store.YES));  y* i. L4 `, y
         doc.add(new StringField("position",positions,Field.Store.YES));: A& K5 N, E5 C, l/ p
         // 加权操作
% [1 f( G6 d4 o8 F2 J( |          TextField field=new TextField("title", titles, Field.Store.YES);; Y$ \- e# }  e, O4 f1 ]3 w5 f' \4 [* S
         if("boss".equals(positions)){7 r' k/ v6 D1 U$ }. }0 G# [
            field.setBoost(1.5f);
0 e0 X1 U' v5 d0 n1 Y3 q* |) {          }
4 ~+ r- g0 f4 R$ K( u          doc.add(field);
# }& M: C; G" G, T          doc.add(new TextField("content", contents, Field.Store.NO));6 Z. Z6 j7 j' d" D
         writer.addDocument(doc); // 添加文档
, D, d  J. G7 {  K) i& R+ x/ k- R       }
3 S: C& d/ R" ^       writer.close();
/ S% R2 U' @; N5 g1 s4 Y }1 a5 F; l$ ^! c; C
2 z- P4 ?2 F# S( U1 C' {/ d
/**( |) ^" ]6 {: s2 q6 A2 i5 h
   * 查询5 {/ z4 [" O) o" z
   * @throws Exception
  Q) R- Z5 a+ J; @6 V    */" k( l3 J% E% j" l. {  k
@Test( u! |. y+ _; C  O% E
public void search()throws Exception{
0 S3 ~* t) K& ~, M" l- s       dir=FSDirectory.open(Paths.get("D:\\lucene3"));* A% j, }" f& b% I4 I+ O9 K' m
      IndexReader reader=DirectoryReader.open(dir);. Y9 I, G  M; Y
      IndexSearcher is=new IndexSearcher(reader);
( l$ [7 X- G/ k, W: X/ U       String searchField="title";
      String q="java";
      Term t=new Term(searchField,q);
8 ~% i- @' O3 ^0 P+ H7 B       Query query=new TermQuery(t);& ^, H- X  C8 X7 y) o. H7 ~
      TopDocs hits=is.search(query, 10);& y, m4 P% C" W- J
      System.out.println("匹配 '"+q+"'，总共查询到"+hits.totalHits+"个文档");
5 Z/ h3 U8 R' o5 j0 s# w, t       for(ScoreDoc scoreDoc:hits.scoreDocs){; P# j% _: s* h0 s
         Document doc=is.doc(scoreDoc.doc);# c# s" r. T" r2 K
         System.out.println(doc.get("author"));; X0 U& v8 v. `
      }
& e3 w3 V: x0 A) h9 V" L- E       reader.close();( l: P' M0 |+ O, H8 z" ~, V
}' e( U( _! A6 n6 A3 l& F
) u" H1 F: F( w/ ?9 E' u4 c
}. S/ v+ S- h& {/ C+ P, r, p

& a* y- r: z; h) F+ \/ @! D/ M( m2 J6 ^& l
; X) m: C" o. t; |

学java来尚学堂 · 发表于 2016-10-29 14:14:51

看了那么多，还是觉得我参加的北京尚学堂的教的好。包教包会，而且毕业就有1W的工资在手。一起来学习吧

wwwfasss · 发表于 2016-10-30 12:24:00

java自学网给力亲测资源可以

		自动登录	找回密码
密码			立即注册

【第三节】Lucene5文档域加权

相关帖子

宣传达人

突出贡献

优秀版主

荣誉管理

论坛元老