lucene-java-commits mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From yo...@apache.org
Subject svn commit: r428488 - /lucene/java/trunk/src/test/org/apache/lucene/index/TestTermdocPerf.java
Date Thu, 03 Aug 2006 19:26:49 GMT
Author: yonik
Date: Thu Aug  3 12:26:48 2006
New Revision: 428488

URL: http://svn.apache.org/viewvc?rev=428488&view=rev
Log:
performance test for TermDoc iteration speed

Added:
    lucene/java/trunk/src/test/org/apache/lucene/index/TestTermdocPerf.java

Added: lucene/java/trunk/src/test/org/apache/lucene/index/TestTermdocPerf.java
URL: http://svn.apache.org/viewvc/lucene/java/trunk/src/test/org/apache/lucene/index/TestTermdocPerf.java?rev=428488&view=auto
==============================================================================
--- lucene/java/trunk/src/test/org/apache/lucene/index/TestTermdocPerf.java (added)
+++ lucene/java/trunk/src/test/org/apache/lucene/index/TestTermdocPerf.java Thu Aug  3 12:26:48
2006
@@ -0,0 +1,115 @@
+package org.apache.lucene.index;
+
+/**
+ * Copyright 2006 The Apache Software Foundation
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+
+import junit.framework.TestCase;
+import org.apache.lucene.store.Directory;
+import org.apache.lucene.store.RAMDirectory;
+import org.apache.lucene.analysis.Analyzer;
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.Token;
+import org.apache.lucene.document.Document;
+import org.apache.lucene.document.Field;
+
+import java.io.Reader;
+import java.io.IOException;
+import java.util.Random;
+
+/**
+ * @author yonik
+ * @version $Id$
+ */
+
+class RepeatingTokenStream extends TokenStream {
+  public int num;
+  Token t;
+
+   public RepeatingTokenStream(String val) {
+     t = new Token(val,0,val.length());
+   }
+
+   public Token next() throws IOException {
+     return --num<0 ? null : t;
+   }
+}
+
+
+public class TestTermdocPerf extends TestCase {
+
+  void addDocs(Directory dir, final int ndocs, String field, final String val, final int
maxTF, final float percentDocs) throws IOException {
+    final Random random = new Random(0);
+    final RepeatingTokenStream ts = new RepeatingTokenStream(val);
+
+    Analyzer analyzer = new Analyzer() {
+      public TokenStream tokenStream(String fieldName, Reader reader) {
+        if (random.nextFloat() < percentDocs) ts.num = random.nextInt(maxTF)+1;
+        else ts.num=0;
+        return ts;
+      }
+    };
+
+    Document doc = new Document();
+    doc.add(new Field(field,val, Field.Store.NO, Field.Index.NO_NORMS));
+    IndexWriter writer = new IndexWriter(dir, analyzer, true);
+    writer.setMaxBufferedDocs(100);
+    writer.setMergeFactor(100);
+
+    for (int i=0; i<ndocs; i++) {
+      writer.addDocument(doc);
+    }
+
+    writer.optimize();
+    writer.close();
+  }
+
+
+  public int doTest(int iter, int ndocs, int maxTF, float percentDocs) throws IOException
{
+    Directory dir = new RAMDirectory();
+
+    long start = System.currentTimeMillis();
+    addDocs(dir, ndocs, "foo", "val", maxTF, percentDocs);
+    long end = System.currentTimeMillis();
+    System.out.println("milliseconds for creation of " + ndocs + " docs = " + (end-start));
+
+    IndexReader reader = IndexReader.open(dir);
+    TermEnum tenum = reader.terms(new Term("foo","val"));
+    TermDocs tdocs = reader.termDocs();
+
+    start = System.currentTimeMillis();
+
+    int ret=0;
+    for (int i=0; i<iter; i++) {
+      tdocs.seek(tenum);
+      while (tdocs.next()) {
+        ret += tdocs.doc();
+      }
+    }
+
+    end = System.currentTimeMillis();
+    System.out.println("milliseconds for " + iter + " TermDocs iteration: " + (end-start));
+
+    return ret;
+  }
+
+  public void testTermDocPerf() throws IOException {
+    // performance test for 10% of documents containing a term
+    // doTest(100000, 10000,3,.1f);
+  }
+
+
+}



Mime
View raw message