ID と の値を使用して、Lucene の 2 つのドキュメントのセットに対して簡単なクエリを実行しようとしていますIntfield
。クエリは、両方のフィールドを追加した直後に正しく返します。次に、取得したドキュメントを使用してCONTEXT_FIELD
(クエリでは使用されていない) に変更を加え、インデックス内のドキュメントを更新します。
興味深いことに、古いドキュメントでも新しいドキュメントでも、検索結果は返されません。METHOD_NAME
クエリでフィールドのみを使用すると、すべてが期待どおりに機能しますが、問題はNUMBER_OF_ARGUMENTS
IntField
.
なぜこうなった?
サンプルコード:
import java.io.File;
import java.io.IOException;
import java.util.HashMap;
import java.util.Map;
import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.core.KeywordAnalyzer;
import org.apache.lucene.analysis.core.SimpleAnalyzer;
import org.apache.lucene.analysis.miscellaneous.PerFieldAnalyzerWrapper;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field;
import org.apache.lucene.document.IntField;
import org.apache.lucene.document.TextField;
import org.apache.lucene.index.DirectoryReader;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.IndexWriterConfig;
import org.apache.lucene.index.IndexWriterConfig.OpenMode;
import org.apache.lucene.index.Term;
import org.apache.lucene.queryparser.classic.ParseException;
import org.apache.lucene.queryparser.classic.QueryParser;
import org.apache.lucene.search.BooleanClause.Occur;
import org.apache.lucene.search.BooleanQuery;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.NumericRangeQuery;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.TopDocs;
import org.apache.lucene.store.FSDirectory;
import org.apache.lucene.util.Version;
public class LuceneDemo {
private static final String ID1 = "Great#text";
private static final String ID2 = "Another#bonus";
private static final String METHOD_NAME_FIELD = "method_name";
private static final String NUMBER_OF_ARGUMENTS = "number_of_arguments";
private static final String CONTEXT_FIELD = "context";
/** Parser used to parse queries */
private static QueryParser parser = new QueryParser(Version.LUCENE_43,
METHOD_NAME_FIELD, createDefaultAnalyzer());
public static void main(String[] args) throws IOException, ParseException {
IndexWriter luceneIndexWriter = new IndexWriter(
FSDirectory.open(new File("/tmp/test")), createWriterConfig(64));
Document doc1 = createDocument(ID1, "context1", 1);
luceneIndexWriter.addDocument(doc1);
Document doc2 = createDocument(ID2, "context2", 2);
luceneIndexWriter.addDocument(doc2);
System.out.println("Found doc1: "
+ findDocument(ID1, 1, luceneIndexWriter));
System.out.println("Found doc2: "
+ findDocument(ID2, 2, luceneIndexWriter));
doc1 = findDocument(ID1, 1, luceneIndexWriter);
// Section 1
doc1.removeField(CONTEXT_FIELD);
doc1.add(new TextField(CONTEXT_FIELD, "context1_changed",
Field.Store.YES));
luceneIndexWriter.updateDocument(new Term(METHOD_NAME_FIELD, "text"),
doc1);
System.out.println("Found doc1: "
+ findDocument(ID1, 1, luceneIndexWriter));
System.out.println("Found doc2: "
+ findDocument(ID2, 2, luceneIndexWriter));
// Section 2
// doc1 = findDocument(ID1, 1, luceneIndexWriter); <- null
doc1.removeField(CONTEXT_FIELD);
doc1.add(new TextField(CONTEXT_FIELD, "context1_changed2",
Field.Store.YES));
luceneIndexWriter.updateDocument(new Term(METHOD_NAME_FIELD, "text"),
doc1);
System.out.println("Found doc1: "
+ findDocument(ID1, 1, luceneIndexWriter));
System.out.println("Found doc2: "
+ findDocument(ID2, 2, luceneIndexWriter));
luceneIndexWriter.close();
}
private static Document createDocument(String id, String context, int value) {
Document doc = new Document();
doc.add(new TextField(METHOD_NAME_FIELD, id, Field.Store.YES));
doc.add(new TextField(CONTEXT_FIELD, context, Field.Store.YES));
doc.add(new IntField(NUMBER_OF_ARGUMENTS, value, Field.Store.YES));
return doc;
}
private static Document findDocument(String id, int value,
IndexWriter luceneIndexWriter) throws IOException, ParseException {
DirectoryReader reader = DirectoryReader.open(luceneIndexWriter, true);
IndexSearcher searcher = new IndexSearcher(reader);
String[] split = id.split("#");
Query methodQuery = parser.parse(split[1]);
Query classQuery = parser.parse(split[0]);
NumericRangeQuery<Integer> range = NumericRangeQuery.newIntRange(
NUMBER_OF_ARGUMENTS, 1, value, value, true, true);
BooleanQuery query = new BooleanQuery();
query.add(methodQuery, Occur.MUST);
query.add(classQuery, Occur.MUST);
query.add(range, Occur.MUST);
TopDocs result = searcher.search(query, 1);
if (result.totalHits == 0) {
System.err.println("Problem, nothing found (Method: " + id + ")");
return null;
}
Document document = searcher.doc(result.scoreDocs[0].doc);
if (document.get(METHOD_NAME_FIELD).equals(id)) {
return document;
}
return null;
}
/** create the analyzer used */
private static Analyzer createDefaultAnalyzer() {
Map<String, Analyzer> analyzerPerField = new HashMap<String, Analyzer>();
analyzerPerField.put(NUMBER_OF_ARGUMENTS, new KeywordAnalyzer());
PerFieldAnalyzerWrapper analyzer = new PerFieldAnalyzerWrapper(
new SimpleAnalyzer(Version.LUCENE_43), analyzerPerField);
return analyzer;
}
/** Creates the configuration used for writing. */
public static IndexWriterConfig createWriterConfig(double ramBufferSizeMB) {
IndexWriterConfig config = new IndexWriterConfig(Version.LUCENE_43,
createDefaultAnalyzer());
config.setRAMBufferSizeMB(ramBufferSizeMB);
config.setOpenMode(OpenMode.CREATE_OR_APPEND);
config.setMaxBufferedDeleteTerms(1); // desperate try at
config.setMaxBufferedDocs(2); // storing everything correctly right away
// config.setInfoStream(System.out); <- set this for more output
return config;
}
}
出力:
Found doc1: Document<stored,indexed,tokenized<method_name:Great#text> stored,indexed,tokenized<context:context1> stored<number_of_arguments:1>>
Found doc2: Document<stored,indexed,tokenized<method_name:Another#bonus> stored,indexed,tokenized<context:context2> stored<number_of_arguments:2>>
Problem, nothing found (Method: Great#text)
Found doc1: null
Found doc2: Document<stored,indexed,tokenized<method_name:Another#bonus> stored,indexed,tokenized<context:context2> stored<number_of_arguments:2>>
Problem, nothing found (Method: Great#text)
Found doc1: null
Found doc2: Document<stored,indexed,tokenized<method_name:Another#bonus> stored,indexed,tokenized<context:context2> stored<number_of_arguments:2>>
config.setInfoStream(System.out) を含む出力:
http://bpaste.net/show/ko8kkxeFxZFE26NuecZc/ (ここに含めるには長すぎます。申し訳ありません)