geode-commits mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From ash...@apache.org
Subject incubator-geode git commit: GEODE-11: Add test to compare inter-buckets scores
Date Thu, 01 Oct 2015 03:12:07 GMT
Repository: incubator-geode
Updated Branches:
  refs/heads/feature/GEODE-11 8fa82ab50 -> 75abaf5ad


GEODE-11: Add test to compare inter-buckets scores


Project: http://git-wip-us.apache.org/repos/asf/incubator-geode/repo
Commit: http://git-wip-us.apache.org/repos/asf/incubator-geode/commit/75abaf5a
Tree: http://git-wip-us.apache.org/repos/asf/incubator-geode/tree/75abaf5a
Diff: http://git-wip-us.apache.org/repos/asf/incubator-geode/diff/75abaf5a

Branch: refs/heads/feature/GEODE-11
Commit: 75abaf5adfbdbf23bbc8f1542be4001eec2a7176
Parents: 8fa82ab
Author: Ashvin Agrawal <ashvin@apache.org>
Authored: Wed Sep 30 15:33:53 2015 -0700
Committer: Ashvin Agrawal <ashvin@apache.org>
Committed: Wed Sep 30 20:10:54 2015 -0700

----------------------------------------------------------------------
 .../DistributedScoringJUnitTest.java            | 136 +++++++++++++++++++
 1 file changed, 136 insertions(+)
----------------------------------------------------------------------


http://git-wip-us.apache.org/repos/asf/incubator-geode/blob/75abaf5a/gemfire-lucene/src/test/java/com/gemstone/gemfire/cache/lucene/internal/distributed/DistributedScoringJUnitTest.java
----------------------------------------------------------------------
diff --git a/gemfire-lucene/src/test/java/com/gemstone/gemfire/cache/lucene/internal/distributed/DistributedScoringJUnitTest.java
b/gemfire-lucene/src/test/java/com/gemstone/gemfire/cache/lucene/internal/distributed/DistributedScoringJUnitTest.java
new file mode 100644
index 0000000..d18c520
--- /dev/null
+++ b/gemfire-lucene/src/test/java/com/gemstone/gemfire/cache/lucene/internal/distributed/DistributedScoringJUnitTest.java
@@ -0,0 +1,136 @@
+package com.gemstone.gemfire.cache.lucene.internal.distributed;
+
+import java.io.IOException;
+import java.util.ArrayList;
+import java.util.Iterator;
+import java.util.List;
+import java.util.concurrent.ConcurrentHashMap;
+
+import org.apache.lucene.analysis.standard.StandardAnalyzer;
+import org.apache.lucene.index.IndexWriter;
+import org.apache.lucene.index.IndexWriterConfig;
+import org.apache.lucene.queryparser.classic.QueryParser;
+import org.apache.lucene.search.Query;
+import org.junit.Assert;
+import org.junit.Before;
+import org.junit.Test;
+import org.junit.experimental.categories.Category;
+import org.mockito.Mockito;
+
+import com.gemstone.gemfire.cache.Region;
+import com.gemstone.gemfire.cache.lucene.internal.directory.RegionDirectory;
+import com.gemstone.gemfire.cache.lucene.internal.filesystem.ChunkKey;
+import com.gemstone.gemfire.cache.lucene.internal.filesystem.File;
+import com.gemstone.gemfire.cache.lucene.internal.repository.IndexRepositoryImpl;
+import com.gemstone.gemfire.cache.lucene.internal.repository.serializer.HeterogenousLuceneSerializer;
+import com.gemstone.gemfire.test.junit.categories.UnitTest;
+
+@Category(UnitTest.class)
+public class DistributedScoringJUnitTest {
+  class TestType {
+    String txt;
+
+    public TestType(String txt) {
+      this.txt = txt;
+    }
+  }
+
+  String[] indexedFields = new String[] { "txt" };
+  HeterogenousLuceneSerializer mapper = new HeterogenousLuceneSerializer(indexedFields);
+
+  final StandardAnalyzer analyzer = new StandardAnalyzer();
+  Region<String, String> region;
+
+  @Before
+  public void createMocks() {
+    region = Mockito.mock(Region.class);
+    Mockito.when(region.isDestroyed()).thenReturn(false);
+  }
+
+  /*
+   * The goal of this test is to verify fair scoring if entries are uniformly distributed.
It compares ordered results
+   * from a single IndexRepository (IR) with merged-ordered results from multiple repositories
(ir1, ir2, ir3). The
+   * records inserted in IR are same as the combined records in irX. This simulates merging
of results from buckets of a
+   * region.
+   */
+  @Test
+  public void uniformDistributionProducesComparableScores() throws Exception {
+    // the strings below have been grouped to be split between three index repositories
+    String[] testStrings = {
+        "hello world",
+        "foo bar",
+        "just any string",
+
+        "hello world is usually the first program",
+        "water on mars",
+        "test world",
+
+        "hello",
+        "test hello test",
+        "find the aliens", };
+
+    QueryParser parser = new QueryParser("txt", analyzer);
+    Query query = parser.parse("hello world");
+
+    IndexRepositoryImpl singleIndexRepo = createIndexRepo();
+    populateIndex(testStrings, singleIndexRepo, 0, testStrings.length);
+
+    TopEntriesCollector collector = new TopEntriesCollector();
+    singleIndexRepo.query(query, 100, collector);
+    List<EntryScore> singleResult = collector.getEntries().getHits();
+
+    IndexRepositoryImpl distIR1 = createIndexRepo();
+    populateIndex(testStrings, distIR1, 0, testStrings.length / 3);
+
+    IndexRepositoryImpl distIR2 = createIndexRepo();
+    populateIndex(testStrings, distIR2, testStrings.length / 3, (testStrings.length * 2)
/ 3);
+
+    IndexRepositoryImpl distIR3 = createIndexRepo();
+    populateIndex(testStrings, distIR3, (testStrings.length * 2) / 3, testStrings.length);
+
+    ArrayList<TopEntriesCollector> collectors = new ArrayList<>();
+    TopEntriesCollectorManager manager = new TopEntriesCollectorManager();
+
+    TopEntriesCollector collector1 = manager.newCollector("");
+    distIR1.query(query, 100, collector1);
+    collectors.add(collector1);
+
+    TopEntriesCollector collector2 = manager.newCollector("");
+    distIR2.query(query, 100, collector2);
+    collectors.add(collector2);
+
+    TopEntriesCollector collector3 = manager.newCollector("");
+    distIR3.query(query, 100, collector3);
+    collectors.add(collector3);
+
+    List<EntryScore> distResult = manager.reduce(collectors).getEntries().getHits();
+    
+    Assert.assertEquals(singleResult.size(), distResult.size());
+    Assert.assertTrue(singleResult.size() > 0);
+    
+    for (Iterator single = distResult.iterator(), dist = singleResult.iterator(); single.hasNext()
&& dist.hasNext();) {
+      EntryScore singleScore = (EntryScore) single.next();
+      EntryScore distScore = (EntryScore) dist.next();
+      Assert.assertEquals(singleScore.getKey(), distScore.getKey());
+    }
+  }
+
+  private void populateIndex(String[] testStrings, IndexRepositoryImpl repo, int start, int
end) throws IOException {
+    for (int i = start; i < end; i++) {
+      String key = "key-" + i;
+      repo.create(key, new TestType(testStrings[i]));
+    }
+    repo.commit();
+  }
+
+  private IndexRepositoryImpl createIndexRepo() throws IOException {
+    ConcurrentHashMap<String, File> fileRegion = new ConcurrentHashMap<String, File>();
+    ConcurrentHashMap<ChunkKey, byte[]> chunkRegion = new ConcurrentHashMap<ChunkKey,
byte[]>();
+    RegionDirectory dir = new RegionDirectory(fileRegion, chunkRegion);
+
+    IndexWriterConfig config = new IndexWriterConfig(analyzer);
+    IndexWriter writer = new IndexWriter(dir, config);
+
+    return new IndexRepositoryImpl(region, writer, mapper);
+  }
+}
\ No newline at end of file


Mime
View raw message