--- /dev/null
+package org.apache.lucene.index;
+
+/**
+ * Copyright 2006 The Apache Software Foundation
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+
+import java.io.IOException;
+import java.io.Reader;
+import java.util.Random;
+
+import org.apache.lucene.analysis.Analyzer;
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.Tokenizer;
+import org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
+import org.apache.lucene.document.Document;
+import org.apache.lucene.document.Field;
+import org.apache.lucene.index.IndexWriterConfig.OpenMode;
+import org.apache.lucene.store.Directory;
+import org.apache.lucene.util.LuceneTestCase;
+
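+/**
+ * A {@link Tokenizer} that repeats a single term a random number of times per
+ * document: {@link #reset()} decides whether the term occurs at all (with
+ * probability {@code percentDocs}) and, if so, how often (between 1 and
+ * {@code maxTF}), and {@link #incrementToken()} then emits it that many times.
+ */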
+class RepeatingTokenStream extends Tokenizer {
+
+ private final Random random;
+ private final float percentDocs;
+ private final int maxTF;
+  private int num;                       // remaining repetitions of the term for the current document
+  private final CharTermAttribute termAtt;
+  private final String value;
+
+ public RepeatingTokenStream(String val, Random random, float percentDocs, int maxTF) {
+ this.value = val;
+ this.random = random;
+ this.percentDocs = percentDocs;
+ this.maxTF = maxTF;
+ this.termAtt = addAttribute(CharTermAttribute.class);
+ }
+
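+  /** Emits the term once per call until the repetition count for the current document is used up. */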
+ @Override
+ public boolean incrementToken() throws IOException {
+ num--;
+ if (num >= 0) {
+ clearAttributes();
+ termAtt.append(value);
+ return true;
+ }
+ return false;
+ }
+
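+  /**
+   * Called once per document: with probability {@code percentDocs} the term will
+   * appear between 1 and {@code maxTF} times, otherwise not at all.
+   */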
+ @Override
+ public void reset() throws IOException {
+ super.reset();
+ if (random.nextFloat() < percentDocs) {
+ num = random.nextInt(maxTF) + 1;
+ } else {
+ num = 0;
+ }
+ }
+}
+
+
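+/**
+ * Micro-benchmark of {@link TermDocs} iteration speed. The benchmark call in
+ * {@link #testTermDocPerf()} is commented out, so the test is a no-op unless
+ * run manually.
+ */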
+public class TestTermdocPerf extends LuceneTestCase {
+
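+  /**
+   * Indexes {@code ndocs} single-field documents whose tokens come from a shared
+   * {@link RepeatingTokenStream}, then optimizes the index down to one segment.
+   */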
+ void addDocs(final Random random, Directory dir, final int ndocs, String field, final String val, final int maxTF, final float percentDocs) throws IOException {
+ final RepeatingTokenStream ts = new RepeatingTokenStream(val, random, percentDocs, maxTF);
+
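+    // analyzer that ignores the incoming reader and always returns the shared repeating stream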
+ Analyzer analyzer = new Analyzer() {
+ @Override
+ public TokenStream tokenStream(String fieldName, Reader reader) {
+ return ts;
+ }
+ };
+
+ Document doc = new Document();
+    // the field must be analyzed, otherwise the repeating stream (and maxTF/percentDocs) is never used
+    doc.add(newField(field, val, Field.Store.NO, Field.Index.ANALYZED_NO_NORMS));
+ IndexWriter writer = new IndexWriter(dir, newIndexWriterConfig(
+ TEST_VERSION_CURRENT, analyzer)
+ .setOpenMode(OpenMode.CREATE).setMaxBufferedDocs(100));
+ ((LogMergePolicy) writer.getConfig().getMergePolicy()).setMergeFactor(100);
+
+ for (int i=0; i<ndocs; i++) {
+ writer.addDocument(doc);
+ }
+
+ writer.optimize();
+ writer.close();
+ }
+
+
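+  /**
+   * Builds an index with the given shape, then runs {@code iter} passes over the
+   * postings of the term {@code foo:val}, printing the timings when {@code VERBOSE}
+   * is set. Returns a checksum of the visited doc ids so the loop cannot be
+   * optimized away.
+   */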
+ public int doTest(int iter, int ndocs, int maxTF, float percentDocs) throws IOException {
+ Directory dir = newDirectory();
+
+ long start = System.currentTimeMillis();
+ addDocs(random, dir, ndocs, "foo", "val", maxTF, percentDocs);
+ long end = System.currentTimeMillis();
+ if (VERBOSE) System.out.println("milliseconds for creation of " + ndocs + " docs = " + (end-start));
+
+ IndexReader reader = IndexReader.open(dir, true);
+ TermEnum tenum = reader.terms(new Term("foo","val"));
+ TermDocs tdocs = reader.termDocs();
+
+ start = System.currentTimeMillis();
+
+ int ret=0;
+ for (int i=0; i<iter; i++) {
+ tdocs.seek(tenum);
+ while (tdocs.next()) {
+ ret += tdocs.doc();
+ }
+ }
+
+ end = System.currentTimeMillis();
+    if (VERBOSE) System.out.println("milliseconds for " + iter + " TermDocs iterations: " + (end-start));
+
+    reader.close();
+    dir.close();
+    return ret;
+ }
+
+ public void testTermDocPerf() throws IOException {
+    // performance test for 10% of documents containing a term;
+    // uncomment to run the benchmark manually:
+    // doTest(100000, 10000, 3, .1f);
+ }
+
+
+}