+++ /dev/null
-package org.apache.lucene.search.regex;
-
-/**
- * Licensed to the Apache Software Foundation (ASF) under one or more
- * contributor license agreements. See the NOTICE file distributed with
- * this work for additional information regarding copyright ownership.
- * The ASF licenses this file to You under the Apache License, Version 2.0
- * (the "License"); you may not use this file except in compliance with
- * the License. You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-import java.io.IOException;
-
-import org.apache.lucene.analysis.MockAnalyzer;
-import org.apache.lucene.document.Document;
-import org.apache.lucene.document.Field;
-import org.apache.lucene.index.CorruptIndexException;
-import org.apache.lucene.index.IndexWriter;
-import org.apache.lucene.index.Term;
-import org.apache.lucene.index.IndexWriterConfig.OpenMode;
-import org.apache.lucene.search.IndexSearcher;
-import org.apache.lucene.search.MultiSearcher;
-import org.apache.lucene.search.spans.SpanFirstQuery;
-import org.apache.lucene.search.spans.SpanMultiTermQueryWrapper;
-import org.apache.lucene.search.spans.SpanNearQuery;
-import org.apache.lucene.search.spans.SpanQuery;
-import org.apache.lucene.store.Directory;
-import org.apache.lucene.store.LockObtainFailedException;
-import org.apache.lucene.util.LuceneTestCase;
-
-public class TestSpanRegexQuery extends LuceneTestCase {
-
- Directory indexStoreA;
- Directory indexStoreB;
-
- @Override
- public void setUp() throws Exception {
- super.setUp();
- indexStoreA = newDirectory();
- indexStoreB = newDirectory();
- }
-
- @Override
- public void tearDown() throws Exception {
- indexStoreA.close();
- indexStoreB.close();
- super.tearDown();
- }
-
- public void testSpanRegex() throws Exception {
- Directory directory = newDirectory();
- IndexWriter writer = new IndexWriter(directory, newIndexWriterConfig(
- TEST_VERSION_CURRENT, new MockAnalyzer(random)));
- Document doc = new Document();
- // doc.add(newField("field", "the quick brown fox jumps over the lazy dog",
- // Field.Store.NO, Field.Index.ANALYZED));
- // writer.addDocument(doc);
- // doc = new Document();
- doc.add(newField("field", "auto update", Field.Store.NO,
- Field.Index.ANALYZED));
- writer.addDocument(doc);
- doc = new Document();
- doc.add(newField("field", "first auto update", Field.Store.NO,
- Field.Index.ANALYZED));
- writer.addDocument(doc);
- writer.optimize();
- writer.close();
-
- IndexSearcher searcher = new IndexSearcher(directory, true);
- SpanQuery srq = new SpanMultiTermQueryWrapper<RegexQuery>(new RegexQuery(new Term("field", "aut.*")));
- SpanFirstQuery sfq = new SpanFirstQuery(srq, 1);
- // SpanNearQuery query = new SpanNearQuery(new SpanQuery[] {srq, stq}, 6,
- // true);
- int numHits = searcher.search(sfq, null, 1000).totalHits;
- assertEquals(1, numHits);
- searcher.close();
- directory.close();
- }
-
- public void testSpanRegexBug() throws CorruptIndexException, IOException {
- createRAMDirectories();
-
- SpanQuery srq = new SpanMultiTermQueryWrapper<RegexQuery>(new RegexQuery(new Term("field", "a.*")));
- SpanQuery stq = new SpanMultiTermQueryWrapper<RegexQuery>(new RegexQuery(new Term("field", "b.*")));
- SpanNearQuery query = new SpanNearQuery(new SpanQuery[] { srq, stq }, 6,
- true);
-
- // 1. Search the same store which works
- IndexSearcher[] arrSearcher = new IndexSearcher[2];
- arrSearcher[0] = new IndexSearcher(indexStoreA, true);
- arrSearcher[1] = new IndexSearcher(indexStoreB, true);
- MultiSearcher searcher = new MultiSearcher(arrSearcher);
- int numHits = searcher.search(query, null, 1000).totalHits;
- arrSearcher[0].close();
- arrSearcher[1].close();
-
- // Will fail here
- // We expect 2 but only one matched
- // The rewriter function only write it once on the first IndexSearcher
- // So it's using term: a1 b1 to search on the second IndexSearcher
- // As a result, it won't match the document in the second IndexSearcher
- assertEquals(2, numHits);
- }
-
- /** remove in lucene 4.0 */
- @Deprecated
- public void testSpanRegexOld() throws Exception {
- Directory directory = newDirectory();
- IndexWriter writer = new IndexWriter(directory, newIndexWriterConfig(
- TEST_VERSION_CURRENT, new MockAnalyzer(random)));
- Document doc = new Document();
- // doc.add(newField("field", "the quick brown fox jumps over the lazy dog",
- // Field.Store.NO, Field.Index.ANALYZED));
- // writer.addDocument(doc);
- // doc = new Document();
- doc.add(newField("field", "auto update", Field.Store.NO,
- Field.Index.ANALYZED));
- writer.addDocument(doc);
- doc = new Document();
- doc.add(newField("field", "first auto update", Field.Store.NO,
- Field.Index.ANALYZED));
- writer.addDocument(doc);
- writer.optimize();
- writer.close();
-
- IndexSearcher searcher = new IndexSearcher(directory, true);
- SpanRegexQuery srq = new SpanRegexQuery(new Term("field", "aut.*"));
- SpanFirstQuery sfq = new SpanFirstQuery(srq, 1);
- // SpanNearQuery query = new SpanNearQuery(new SpanQuery[] {srq, stq}, 6,
- // true);
- int numHits = searcher.search(sfq, null, 1000).totalHits;
- assertEquals(1, numHits);
- searcher.close();
- directory.close();
- }
-
- /** remove in lucene 4.0 */
- @Deprecated
- public void testSpanRegexBugOld() throws CorruptIndexException, IOException {
- createRAMDirectories();
-
- SpanRegexQuery srq = new SpanRegexQuery(new Term("field", "a.*"));
- SpanRegexQuery stq = new SpanRegexQuery(new Term("field", "b.*"));
- SpanNearQuery query = new SpanNearQuery(new SpanQuery[] { srq, stq }, 6,
- true);
-
- // 1. Search the same store which works
- IndexSearcher[] arrSearcher = new IndexSearcher[2];
- arrSearcher[0] = new IndexSearcher(indexStoreA, true);
- arrSearcher[1] = new IndexSearcher(indexStoreB, true);
- MultiSearcher searcher = new MultiSearcher(arrSearcher);
- int numHits = searcher.search(query, null, 1000).totalHits;
- arrSearcher[0].close();
- arrSearcher[1].close();
-
- // Will fail here
- // We expect 2 but only one matched
- // The rewriter function only write it once on the first IndexSearcher
- // So it's using term: a1 b1 to search on the second IndexSearcher
- // As a result, it won't match the document in the second IndexSearcher
- assertEquals(2, numHits);
- }
-
- private void createRAMDirectories() throws CorruptIndexException,
- LockObtainFailedException, IOException {
- // creating a document to store
- Document lDoc = new Document();
- lDoc.add(newField("field", "a1 b1", Field.Store.NO,
- Field.Index.ANALYZED_NO_NORMS));
-
- // creating a document to store
- Document lDoc2 = new Document();
- lDoc2.add(newField("field", "a2 b2", Field.Store.NO,
- Field.Index.ANALYZED_NO_NORMS));
-
- // creating first index writer
- IndexWriter writerA = new IndexWriter(indexStoreA, newIndexWriterConfig(
- TEST_VERSION_CURRENT, new MockAnalyzer(random)).setOpenMode(OpenMode.CREATE));
- writerA.addDocument(lDoc);
- writerA.optimize();
- writerA.close();
-
- // creating second index writer
- IndexWriter writerB = new IndexWriter(indexStoreB, newIndexWriterConfig(
- TEST_VERSION_CURRENT, new MockAnalyzer(random)).setOpenMode(OpenMode.CREATE));
- writerB.addDocument(lDoc2);
- writerB.optimize();
- writerB.close();
- }
-}