Lucene使用SortField对多个字段进行排序
2015-04-03 10:36
344 查看
/*
* 这里的类实现的功能是对多个字段进行排序
* 比单个难度要大,但是有相应的方法,可以满足不同项目的不同需求
* */
package score;
import java.io.IOException;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.Term;
import org.apache.lucene.search.Hits;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.RangeQuery;
import org.apache.lucene.search.Sort;
import org.apache.lucene.search.SortField;
public class SortFieldTest {
public SortFieldTest(String INDEX_STORE_PATH){
try{
IndexWriter writer = new IndexWriter(INDEX_STORE_PATH, new StandardAnalyzer(), true);
writer.setUseCompoundFile(false);
//首先定义文本
Document doc1 = new Document();
Field f1 = new Field("bookNumber", "0000001", Field.Store.YES, Field.Index.UN_TOKENIZED);
Field f2 = new Field("bookname", "钢铁是怎样炼成的", Field.Store.YES, Field.Index.TOKENIZED);
Field f3 = new Field("publishdate", "1970-01-01", Field.Store.YES, Field.Index.UN_TOKENIZED);
doc1.add(f1);
doc1.add(f2);
doc1.add(f3);
Document doc2 = new Document();
f1 = new Field("bookNumber", "0000002", Field.Store.YES, Field.Index.UN_TOKENIZED);
f2 = new Field("bookname", "钢铁战士", Field.Store.YES, Field.Index.TOKENIZED);
f3 = new Field("publishdate", "1980-01-01", Field.Store.YES, Field.Index.UN_TOKENIZED);
doc2.add(f1);
doc2.add(f2);
doc2.add(f3);
Document doc3 = new Document();
f1 = new Field("bookNumber", "0000003", Field.Store.YES, Field.Index.UN_TOKENIZED);
f2 = new Field("bookname", "篱笆女人和狗", Field.Store.YES, Field.Index.TOKENIZED);
f3 = new Field("publishdate", "1990-01-01", Field.Store.YES, Field.Index.UN_TOKENIZED);
doc3.add(f1);
doc3.add(f2);
doc3.add(f3);
Document doc4 = new Document();
f1 = new Field("bookNumber", "0000004", Field.Store.YES, Field.Index.UN_TOKENIZED);
f2 = new Field("bookname", "女人是水做的", Field.Store.YES, Field.Index.TOKENIZED);
f3 = new Field("publishdate", "1999-01-01", Field.Store.YES, Field.Index.UN_TOKENIZED);
doc4.add(f1);
doc4.add(f2);
doc4.add(f3);
Document doc5 = new Document();
f1 = new Field("bookNumber", "0000005", Field.Store.YES, Field.Index.UN_TOKENIZED);
f2 = new Field("bookname", "英雄儿女", Field.Store.YES, Field.Index.TOKENIZED);
f3 = new Field("publishdate", "2002-01-01", Field.Store.YES, Field.Index.UN_TOKENIZED);
doc5.add(f1);
doc5.add(f2);
doc5.add(f3);
Document doc6 = new Document();
f1 = new Field("bookNumber", "0000006", Field.Store.YES, Field.Index.UN_TOKENIZED);
f2 = new Field("bookname", "白毛女", Field.Store.YES, Field.Index.TOKENIZED);
f3 = new Field("publishdate", "1985-01-01", Field.Store.YES, Field.Index.UN_TOKENIZED);
doc6.add(f1);
doc6.add(f2);
doc6.add(f3);
Document doc7 = new Document();
f1 = new Field("bookNumber", "0000007", Field.Store.YES, Field.Index.UN_TOKENIZED);
f2 = new Field("bookname", "我的兄弟和女儿", Field.Store.YES, Field.Index.TOKENIZED);
f3 = new Field("publishdate", "1978-01-01", Field.Store.YES, Field.Index.UN_TOKENIZED);
doc7.add(f1);
doc7.add(f2);
doc7.add(f3);
//将书信息加入索引
writer.addDocument(doc1);
writer.addDocument(doc2);
writer.addDocument(doc3);
writer.addDocument(doc4);
writer.addDocument(doc5);
writer.addDocument(doc6);
writer.addDocument(doc7);
writer.close();
//构建一个查询
IndexSearcher searcher = new IndexSearcher(INDEX_STORE_PATH);
Term begin = new Term("publishdate", "1950-01-01");
Term end = new Term("publishdate", "2002-01-01");
RangeQuery rq = new RangeQuery(begin, end, false);
//构建两个SortField
Sort sort = new Sort();
//按照publishdate排序,降序
SortField sf1 = new SortField("publishdate", SortField.STRING, true);
//按bookNumber排序,升序
SortField sf2 = new SortField("bookname", SortField.INT, false);
//先按照publishdate排,在按照bookNumber排
sort.setSort(new SortField[]{sf1, sf2});
Hits hits = searcher.search(rq, sort);
for(int i = 0; i < hits.length(); i++){
Document doc = hits.doc(i);
System.out.print("书名 :");
System.out.println(doc.get("bookname"));
System.out.print("得分 :");
System.out.println(hits.score(i));
System.out.print("内部ID :");
System.out.println(hits.id(i));
System.out.print("书号 : ");
System.out.println(doc.get("bookNumber"));
System.out.print("发行日期 : ");
System.out.println(doc.get("publishdate"));
System.out.println("===========================");
}
}catch(IOException e){
e.printStackTrace();
}
}
public static void main(String[] args) {
// TODO Auto-generated method stub
SortFieldTest sft = new SortFieldTest("E:\\Lucene项目\\索引文件");
}
}
* 这里的类实现的功能是对多个字段进行排序
* 比单个难度要大,但是有相应的方法,可以满足不同项目的不同需求
* */
package score;
import java.io.IOException;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.Term;
import org.apache.lucene.search.Hits;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.RangeQuery;
import org.apache.lucene.search.Sort;
import org.apache.lucene.search.SortField;
public class SortFieldTest {
public SortFieldTest(String INDEX_STORE_PATH){
try{
IndexWriter writer = new IndexWriter(INDEX_STORE_PATH, new StandardAnalyzer(), true);
writer.setUseCompoundFile(false);
//首先定义文本
Document doc1 = new Document();
Field f1 = new Field("bookNumber", "0000001", Field.Store.YES, Field.Index.UN_TOKENIZED);
Field f2 = new Field("bookname", "钢铁是怎样炼成的", Field.Store.YES, Field.Index.TOKENIZED);
Field f3 = new Field("publishdate", "1970-01-01", Field.Store.YES, Field.Index.UN_TOKENIZED);
doc1.add(f1);
doc1.add(f2);
doc1.add(f3);
Document doc2 = new Document();
f1 = new Field("bookNumber", "0000002", Field.Store.YES, Field.Index.UN_TOKENIZED);
f2 = new Field("bookname", "钢铁战士", Field.Store.YES, Field.Index.TOKENIZED);
f3 = new Field("publishdate", "1980-01-01", Field.Store.YES, Field.Index.UN_TOKENIZED);
doc2.add(f1);
doc2.add(f2);
doc2.add(f3);
Document doc3 = new Document();
f1 = new Field("bookNumber", "0000003", Field.Store.YES, Field.Index.UN_TOKENIZED);
f2 = new Field("bookname", "篱笆女人和狗", Field.Store.YES, Field.Index.TOKENIZED);
f3 = new Field("publishdate", "1990-01-01", Field.Store.YES, Field.Index.UN_TOKENIZED);
doc3.add(f1);
doc3.add(f2);
doc3.add(f3);
Document doc4 = new Document();
f1 = new Field("bookNumber", "0000004", Field.Store.YES, Field.Index.UN_TOKENIZED);
f2 = new Field("bookname", "女人是水做的", Field.Store.YES, Field.Index.TOKENIZED);
f3 = new Field("publishdate", "1999-01-01", Field.Store.YES, Field.Index.UN_TOKENIZED);
doc4.add(f1);
doc4.add(f2);
doc4.add(f3);
Document doc5 = new Document();
f1 = new Field("bookNumber", "0000005", Field.Store.YES, Field.Index.UN_TOKENIZED);
f2 = new Field("bookname", "英雄儿女", Field.Store.YES, Field.Index.TOKENIZED);
f3 = new Field("publishdate", "2002-01-01", Field.Store.YES, Field.Index.UN_TOKENIZED);
doc5.add(f1);
doc5.add(f2);
doc5.add(f3);
Document doc6 = new Document();
f1 = new Field("bookNumber", "0000006", Field.Store.YES, Field.Index.UN_TOKENIZED);
f2 = new Field("bookname", "白毛女", Field.Store.YES, Field.Index.TOKENIZED);
f3 = new Field("publishdate", "1985-01-01", Field.Store.YES, Field.Index.UN_TOKENIZED);
doc6.add(f1);
doc6.add(f2);
doc6.add(f3);
Document doc7 = new Document();
f1 = new Field("bookNumber", "0000007", Field.Store.YES, Field.Index.UN_TOKENIZED);
f2 = new Field("bookname", "我的兄弟和女儿", Field.Store.YES, Field.Index.TOKENIZED);
f3 = new Field("publishdate", "1978-01-01", Field.Store.YES, Field.Index.UN_TOKENIZED);
doc7.add(f1);
doc7.add(f2);
doc7.add(f3);
//将书信息加入索引
writer.addDocument(doc1);
writer.addDocument(doc2);
writer.addDocument(doc3);
writer.addDocument(doc4);
writer.addDocument(doc5);
writer.addDocument(doc6);
writer.addDocument(doc7);
writer.close();
//构建一个查询
IndexSearcher searcher = new IndexSearcher(INDEX_STORE_PATH);
Term begin = new Term("publishdate", "1950-01-01");
Term end = new Term("publishdate", "2002-01-01");
RangeQuery rq = new RangeQuery(begin, end, false);
//构建两个SortField
Sort sort = new Sort();
//按照publishdate排序,降序
SortField sf1 = new SortField("publishdate", SortField.STRING, true);
//按bookNumber排序,升序
SortField sf2 = new SortField("bookname", SortField.INT, false);
//先按照publishdate排,在按照bookNumber排
sort.setSort(new SortField[]{sf1, sf2});
Hits hits = searcher.search(rq, sort);
for(int i = 0; i < hits.length(); i++){
Document doc = hits.doc(i);
System.out.print("书名 :");
System.out.println(doc.get("bookname"));
System.out.print("得分 :");
System.out.println(hits.score(i));
System.out.print("内部ID :");
System.out.println(hits.id(i));
System.out.print("书号 : ");
System.out.println(doc.get("bookNumber"));
System.out.print("发行日期 : ");
System.out.println(doc.get("publishdate"));
System.out.println("===========================");
}
}catch(IOException e){
e.printStackTrace();
}
}
public static void main(String[] args) {
// TODO Auto-generated method stub
SortFieldTest sft = new SortFieldTest("E:\\Lucene项目\\索引文件");
}
}
相关文章推荐
- Lucene使用Sort方法对文档进行排序
- Gson库使用-排序字段(ExclusionStrategy)或者修改(FieldNamingStrategy)字段
- 使用c++的 list.sort()进行排序
- 排序例子2:使用sort()方法对数组进行排序
- 使用lucene的多字段排序--回复网友BUFFON
- 使用Collections.sort()对List/ArrayList进行排序 推荐
- 如何使用Arrays.sort()对自己定义的类进行排序
- 使用sort方法对数组进行排序
- lucene 排序 (Sort SortField 构造函数)
- 对于集合中的自定义对象使用collections.sort 进行排序,需要实现compartor接口
- lucene利用sort对查询结果进行排序示例
- 由多个Object(以Teacher为例)对象所形成的数组可以使用Arrays.sort方法进行排序(编号由低到高排序)。
- lucene按照某个字段进行排序
- 练习使用 STL sort 对容器进行排序
- ajax返回的json内容进行排序使用sort()方法实现
- shell中使用sort进行多列排序.
- 由多个Object(以Teacher为例)对象所形成的数组可以使用Arrays.sort方法进行排序(编号由低到高排序)。
- Go语言:使用sort包对任意类型元素的集合进行排序
- oracle 使用order by 对汉字进行多字段排序
- Collections.sort()使用自定义比较器进行排序