X-Git-Url: https://git.mdrn.pl/pylucene.git/blobdiff_plain/a2e61f0c04805cfcb8706176758d1283c7e3a55c..aaeed5504b982cf3545252ab528713250aa33eed:/lucene-java-3.5.0/lucene/backwards/src/test/org/apache/lucene/index/TestTermdocPerf.java diff --git a/lucene-java-3.5.0/lucene/backwards/src/test/org/apache/lucene/index/TestTermdocPerf.java b/lucene-java-3.5.0/lucene/backwards/src/test/org/apache/lucene/index/TestTermdocPerf.java new file mode 100644 index 0000000..6d82f49 --- /dev/null +++ b/lucene-java-3.5.0/lucene/backwards/src/test/org/apache/lucene/index/TestTermdocPerf.java @@ -0,0 +1,137 @@ +package org.apache.lucene.index; + +/** + * Copyright 2006 The Apache Software Foundation + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + + +import java.io.IOException; +import java.io.Reader; +import java.util.Random; + +import org.apache.lucene.analysis.Analyzer; +import org.apache.lucene.analysis.ReusableAnalyzerBase; +import org.apache.lucene.analysis.TokenStream; +import org.apache.lucene.analysis.Tokenizer; +import org.apache.lucene.analysis.tokenattributes.CharTermAttribute; +import org.apache.lucene.document.Document; +import org.apache.lucene.document.Field; +import org.apache.lucene.index.IndexWriterConfig.OpenMode; +import org.apache.lucene.store.Directory; +import org.apache.lucene.util.LuceneTestCase; + +class RepeatingTokenStream extends Tokenizer { + + private final Random random; + private final float percentDocs; + private final int maxTF; + private int num; + CharTermAttribute termAtt; + String value; + + public RepeatingTokenStream(String val, Random random, float percentDocs, int maxTF) { + this.value = val; + this.random = random; + this.percentDocs = percentDocs; + this.maxTF = maxTF; + this.termAtt = addAttribute(CharTermAttribute.class); + } + + @Override + public boolean incrementToken() throws IOException { + num--; + if (num >= 0) { + clearAttributes(); + termAtt.append(value); + return true; + } + return false; + } + + @Override + public void reset() throws IOException { + super.reset(); + if (random.nextFloat() < percentDocs) { + num = random.nextInt(maxTF) + 1; + } else { + num = 0; + } + } +} + + +public class TestTermdocPerf extends LuceneTestCase { + + void addDocs(final Random random, Directory dir, final int ndocs, String field, final String val, final int maxTF, final float percentDocs) throws IOException { + final RepeatingTokenStream ts = new RepeatingTokenStream(val, random, percentDocs, maxTF); + + Analyzer analyzer = new Analyzer() { + @Override + public TokenStream tokenStream(String fieldName, Reader reader) { + return ts; + } + }; + + Document doc = new Document(); + doc.add(newField(field,val, Field.Store.NO, Field.Index.NOT_ANALYZED_NO_NORMS)); + IndexWriter writer = new IndexWriter(dir, newIndexWriterConfig( + TEST_VERSION_CURRENT, analyzer) + .setOpenMode(OpenMode.CREATE).setMaxBufferedDocs(100)); + ((LogMergePolicy) writer.getConfig().getMergePolicy()).setMergeFactor(100); + + for (int i=0; i