hadoop-common-commits mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From jl...@apache.org
Subject svn commit: r1528620 - in /hadoop/common/trunk/hadoop-common-project/hadoop-common: ./ src/test/java/org/apache/hadoop/util/bloom/ src/test/java/org/apache/hadoop/util/hash/
Date Wed, 02 Oct 2013 20:50:43 GMT
Author: jlowe
Date: Wed Oct  2 20:50:42 2013
New Revision: 1528620

URL: http://svn.apache.org/r1528620
Log:
HADOOP-9254. Cover packages org.apache.hadoop.util.bloom, org.apache.hadoop.util.hash. Contributed
by Vadim Bondarev

Added:
    hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/bloom/
    hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/bloom/BloomFilterCommonTester.java
  (with props)
    hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/bloom/TestBloomFilters.java
  (with props)
    hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/hash/
    hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/hash/TestHash.java
  (with props)
Modified:
    hadoop/common/trunk/hadoop-common-project/hadoop-common/CHANGES.txt

Modified: hadoop/common/trunk/hadoop-common-project/hadoop-common/CHANGES.txt
URL: http://svn.apache.org/viewvc/hadoop/common/trunk/hadoop-common-project/hadoop-common/CHANGES.txt?rev=1528620&r1=1528619&r2=1528620&view=diff
==============================================================================
--- hadoop/common/trunk/hadoop-common-project/hadoop-common/CHANGES.txt (original)
+++ hadoop/common/trunk/hadoop-common-project/hadoop-common/CHANGES.txt Wed Oct  2 20:50:42
2013
@@ -342,6 +342,9 @@ Release 2.3.0 - UNRELEASED
     HADOOP-9063. enhance unit-test coverage of class
     org.apache.hadoop.fs.FileUtil (Ivan A. Veselovsky via jlowe)
 
+    HADOOP-9254. Cover packages org.apache.hadoop.util.bloom,
+    org.apache.hadoop.util.hash (Vadim Bondarev via jlowe)
+
   OPTIMIZATIONS
 
     HADOOP-9748. Reduce blocking on UGI.ensureInitialized (daryn)

Added: hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/bloom/BloomFilterCommonTester.java
URL: http://svn.apache.org/viewvc/hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/bloom/BloomFilterCommonTester.java?rev=1528620&view=auto
==============================================================================
--- hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/bloom/BloomFilterCommonTester.java
(added)
+++ hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/bloom/BloomFilterCommonTester.java
Wed Oct  2 20:50:42 2013
@@ -0,0 +1,533 @@
+package org.apache.hadoop.util.bloom;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import static org.junit.Assert.assertFalse;
+import static org.junit.Assert.assertTrue;
+
+import java.io.IOException;
+import java.util.AbstractCollection;
+import java.util.Collection;
+import java.util.Iterator;
+import java.util.Random;
+
+import org.junit.Assert;
+import org.apache.hadoop.io.DataInputBuffer;
+import org.apache.hadoop.io.DataOutputBuffer;
+import org.apache.hadoop.util.hash.Hash;
+import org.apache.log4j.Logger;
+
+import com.google.common.collect.ImmutableList;
+import com.google.common.collect.ImmutableSet;
+
+public class BloomFilterCommonTester<T extends Filter> {
+
+  private static final double LN2 = Math.log(2);
+  private static final double LN2_SQUARED = LN2 * LN2;
+
+  private final int hashType;
+  private final int numInsertions;
+
+  private final ImmutableList.Builder<T> builder = ImmutableList.builder();
+
+  private ImmutableSet<BloomFilterTestStrategy> filterTestStrateges;
+
+  private final PreAssertionHelper preAssertionHelper;
+
+  static int optimalNumOfBits(int n, double p) {
+    return (int) (-n * Math.log(p) / LN2_SQUARED);
+  }
+  
+  public static <T extends Filter> BloomFilterCommonTester<T> of(int hashId,
+      int numInsertions) {
+    return new BloomFilterCommonTester<T>(hashId, numInsertions);
+  }
+
+  public BloomFilterCommonTester<T> withFilterInstance(T filter) {
+    builder.add(filter);
+    return this;
+  }
+
+  private BloomFilterCommonTester(int hashId, int numInsertions) {
+    this.hashType = hashId;
+    this.numInsertions = numInsertions;
+
+    this.preAssertionHelper = new PreAssertionHelper() {
+
+      @Override
+      public ImmutableSet<Integer> falsePositives(int hashId) {
+        switch (hashId) {
+        case Hash.JENKINS_HASH: {
+          // // false pos for odd and event under 1000
+          return ImmutableSet.of(99, 963);
+        }
+        case Hash.MURMUR_HASH: {
+          // false pos for odd and event under 1000
+          return ImmutableSet.of(769, 772, 810, 874);
+        }
+        default: {
+          // fail fast with unknown hash error !!!
+          Assert.assertFalse("unknown hash error", true);
+          return ImmutableSet.of();
+        }
+        }
+      }
+    };
+  }
+
+  public BloomFilterCommonTester<T> withTestCases(
+      ImmutableSet<BloomFilterTestStrategy> filterTestStrateges) {
+    this.filterTestStrateges = ImmutableSet.copyOf(filterTestStrateges);
+    return this;
+  }
+
+  @SuppressWarnings("unchecked")
+  public void test() {
+    final ImmutableList<T> filtersList = builder.build();
+    final ImmutableSet<Integer> falsePositives = preAssertionHelper
+        .falsePositives(hashType);
+
+    for (T filter : filtersList) {
+      for (BloomFilterTestStrategy strategy : filterTestStrateges) {
+        strategy.getStrategy().assertWhat(filter, numInsertions, hashType, falsePositives);
+        // create fresh instance for next test iteration 
+        filter = (T) getSymmetricFilter(filter.getClass(), numInsertions, hashType);    
           
+      }
+    }
+  }
+
+  interface FilterTesterStrategy {
+    final Logger logger = Logger.getLogger(FilterTesterStrategy.class);
+
+    void assertWhat(Filter filter, int numInsertions, int hashId,
+        ImmutableSet<Integer> falsePositives);
+  }
+
+  private static Filter getSymmetricFilter(Class<?> filterClass,
+      int numInsertions, int hashType) {
+    int bitSetSize = optimalNumOfBits(numInsertions, 0.03);
+    int hashFunctionNumber = 5; 
+    
+    if (filterClass == BloomFilter.class) {
+      return new BloomFilter(bitSetSize, hashFunctionNumber, hashType);
+    } else if (filterClass == CountingBloomFilter.class) {
+      return new CountingBloomFilter(bitSetSize, hashFunctionNumber, hashType);
+    } else if (filterClass == RetouchedBloomFilter.class) {
+      return new RetouchedBloomFilter(bitSetSize, hashFunctionNumber, hashType);
+    } else if (filterClass == DynamicBloomFilter.class) {
+      return new DynamicBloomFilter(bitSetSize, hashFunctionNumber, hashType, 3);
+    } else {
+      //fail fast
+      assertFalse("unexpected filterClass", true);
+      return null;
+    } 
+  }
+
+  public enum BloomFilterTestStrategy {
+
+    ADD_KEYS_STRATEGY(new FilterTesterStrategy() {
+
+      private final ImmutableList<Key> keys = ImmutableList.of(new Key(
+          new byte[] { 49, 48, 48 }), new Key(new byte[] { 50, 48, 48 }));
+
+      @Override
+      public void assertWhat(Filter filter, int numInsertions, int hashId,
+          ImmutableSet<Integer> falsePositives) {
+
+        filter.add(keys);
+
+        assertTrue(" might contain key error ",
+            filter.membershipTest(new Key("100".getBytes())));
+        assertTrue(" might contain key error ",
+            filter.membershipTest(new Key("200".getBytes())));
+
+        filter.add(keys.toArray(new Key[] {}));
+
+        assertTrue(" might contain key error ",
+            filter.membershipTest(new Key("100".getBytes())));
+        assertTrue(" might contain key error ",
+            filter.membershipTest(new Key("200".getBytes())));
+
+        filter.add(new AbstractCollection<Key>() {
+
+          @Override
+          public Iterator<Key> iterator() {
+            return keys.iterator();
+          }
+
+          @Override
+          public int size() {
+            return keys.size();
+          }
+
+        });
+
+        assertTrue(" might contain key error ",
+            filter.membershipTest(new Key("100".getBytes())));
+        assertTrue(" might contain key error ",
+            filter.membershipTest(new Key("200".getBytes())));
+      }
+    }),
+
+    KEY_TEST_STRATEGY(new FilterTesterStrategy() {
+
+      private void checkOnKeyMethods() {
+        String line = "werabsdbe";
+
+        Key key = new Key(line.getBytes());
+        assertTrue("default key weight error ", key.getWeight() == 1d);
+
+        key.set(line.getBytes(), 2d);
+        assertTrue(" setted key weight error ", key.getWeight() == 2d);
+
+        Key sKey = new Key(line.getBytes(), 2d);
+        assertTrue("equals error", key.equals(sKey));
+        assertTrue("hashcode error", key.hashCode() == sKey.hashCode());
+
+        sKey = new Key(line.concat("a").getBytes(), 2d);
+        assertFalse("equals error", key.equals(sKey));
+        assertFalse("hashcode error", key.hashCode() == sKey.hashCode());
+
+        sKey = new Key(line.getBytes(), 3d);
+        assertFalse("equals error", key.equals(sKey));
+        assertFalse("hashcode error", key.hashCode() == sKey.hashCode());
+
+        key.incrementWeight();
+        assertTrue("weight error", key.getWeight() == 3d);
+
+        key.incrementWeight(2d);
+        assertTrue("weight error", key.getWeight() == 5d);
+      }
+
+      private void checkOnReadWrite() {
+        String line = "qryqeb354645rghdfvbaq23312fg";
+        DataOutputBuffer out = new DataOutputBuffer();
+        DataInputBuffer in = new DataInputBuffer();
+        Key originKey = new Key(line.getBytes(), 100d);
+        try {
+          originKey.write(out);
+          in.reset(out.getData(), out.getData().length);
+          Key restoredKey = new Key(new byte[] { 0 });
+          assertFalse("checkOnReadWrite equals error", restoredKey.equals(originKey));
+          restoredKey.readFields(in);
+          assertTrue("checkOnReadWrite equals error", restoredKey.equals(originKey));
+          out.reset();
+        } catch (Exception ioe) {
+          Assert.fail("checkOnReadWrite ex error");
+        }
+      }
+
+      private void checkSetOnIAE() {
+        Key key = new Key();
+        try {
+          key.set(null, 0);
+        } catch (IllegalArgumentException ex) {
+          // expected
+        } catch (Exception e) {
+          Assert.fail("checkSetOnIAE ex error");
+        }
+      }
+
+      @Override
+      public void assertWhat(Filter filter, int numInsertions, int hashId,
+          ImmutableSet<Integer> falsePositives) {
+        checkOnKeyMethods();
+        checkOnReadWrite();
+        checkSetOnIAE();
+      }
+    }),
+
+    EXCEPTIONS_CHECK_STRATEGY(new FilterTesterStrategy() {
+
+      @Override
+      public void assertWhat(Filter filter, int numInsertions, int hashId,
+          ImmutableSet<Integer> falsePositives) {
+        checkAddOnNPE(filter);
+        checkTestMembershipOnNPE(filter);
+        checkAndOnIAE(filter);       
+      }
+
+      private void checkAndOnIAE(Filter filter) {
+        Filter tfilter = null;
+
+        try {
+          Collection<Key> keys = null;
+          filter.add(keys);
+        } catch (IllegalArgumentException ex) {
+          //
+        } catch (Exception e) {
+          Assert.fail("" + e);
+        }
+
+        try {
+          Key[] keys = null;
+          filter.add(keys);
+        } catch (IllegalArgumentException ex) {
+          //
+        } catch (Exception e) {
+          Assert.fail("" + e);
+        }
+
+        try {
+          ImmutableList<Key> keys = null;
+          filter.add(keys);
+        } catch (IllegalArgumentException ex) {
+          //
+        } catch (Exception e) {
+          Assert.fail("" + e);
+        }
+
+        try {
+          filter.and(tfilter);
+        } catch (IllegalArgumentException ex) {
+          // expected
+        } catch (Exception e) {
+          Assert.fail("" + e);
+        }
+
+        try {
+          filter.or(tfilter);
+        } catch (IllegalArgumentException ex) {
+          // expected
+        } catch (Exception e) {
+          Assert.fail("" + e);
+        }
+
+        try {
+          filter.xor(tfilter);
+        } catch (IllegalArgumentException ex) {
+          // expected
+        } catch (UnsupportedOperationException unex) {
+          //
+        } catch (Exception e) {
+          Assert.fail("" + e);
+        }
+
+      }
+
+      private void checkTestMembershipOnNPE(Filter filter) {
+        try {
+          Key nullKey = null;
+          filter.membershipTest(nullKey);
+        } catch (NullPointerException ex) {
+          // expected
+        } catch (Exception e) {
+          Assert.fail("" + e);
+        }
+      }
+
+      private void checkAddOnNPE(Filter filter) {
+        try {
+          Key nullKey = null;
+          filter.add(nullKey);
+        } catch (NullPointerException ex) {
+          // expected
+        } catch (Exception e) {
+          Assert.fail("" + e);
+        }
+      }
+    }),
+
+    ODD_EVEN_ABSENT_STRATEGY(new FilterTesterStrategy() {
+
+      @Override
+      public void assertWhat(Filter filter, int numInsertions, int hashId,
+          ImmutableSet<Integer> falsePositives) {
+
+        // add all even keys
+        for (int i = 0; i < numInsertions; i += 2) {
+          filter.add(new Key(Integer.toString(i).getBytes()));
+        }
+
+        // check on present even key
+        for (int i = 0; i < numInsertions; i += 2) {
+          Assert.assertTrue(" filter might contains " + i,
+              filter.membershipTest(new Key(Integer.toString(i).getBytes())));
+        }
+
+        // check on absent odd in event
+        for (int i = 1; i < numInsertions; i += 2) {
+          if (!falsePositives.contains(i)) {
+            assertFalse(" filter should not contain " + i,
+                filter.membershipTest(new Key(Integer.toString(i).getBytes())));
+          }
+        }
+      }
+    }),
+
+    WRITE_READ_STRATEGY(new FilterTesterStrategy() {
+
+      private int slotSize = 10;
+
+      @Override
+      public void assertWhat(Filter filter, int numInsertions, int hashId,
+          ImmutableSet<Integer> falsePositives) {
+
+        final Random rnd = new Random();
+        final DataOutputBuffer out = new DataOutputBuffer();
+        final DataInputBuffer in = new DataInputBuffer();
+        try {
+          Filter tempFilter = getSymmetricFilter(filter.getClass(),
+              numInsertions, hashId);
+          ImmutableList.Builder<Integer> blist = ImmutableList.builder();
+          for (int i = 0; i < slotSize; i++) {
+            blist.add(rnd.nextInt(numInsertions * 2));
+          }
+
+          ImmutableList<Integer> list = blist.build();
+
+          // mark bits for later check
+          for (Integer slot : list) {
+            filter.add(new Key(String.valueOf(slot).getBytes()));
+          }
+
+          filter.write(out);
+          in.reset(out.getData(), out.getLength());
+          tempFilter.readFields(in);
+
+          for (Integer slot : list) {
+            assertTrue("read/write mask check filter error on " + slot,
+                filter.membershipTest(new Key(String.valueOf(slot).getBytes())));
+          }
+
+        } catch (IOException ex) {
+          Assert.fail("error ex !!!" + ex);
+        }
+      }
+    }),
+
+    FILTER_XOR_STRATEGY(new FilterTesterStrategy() {
+
+      @Override
+      public void assertWhat(Filter filter, int numInsertions, int hashId,
+          ImmutableSet<Integer> falsePositives) {
+        Filter symmetricFilter = getSymmetricFilter(filter.getClass(),
+            numInsertions, hashId);
+        try {
+          // 0 xor 0 -> 0
+          filter.xor(symmetricFilter);
+          // check on present all key
+          for (int i = 0; i < numInsertions; i++) {
+            Assert.assertFalse(" filter might contains " + i,
+                filter.membershipTest(new Key(Integer.toString(i).getBytes())));
+          }
+
+          // add all even keys
+          for (int i = 0; i < numInsertions; i += 2) {
+            filter.add(new Key(Integer.toString(i).getBytes()));
+          }
+
+          // add all odd keys
+          for (int i = 0; i < numInsertions; i += 2) {
+            symmetricFilter.add(new Key(Integer.toString(i).getBytes()));
+          }
+
+          filter.xor(symmetricFilter);
+          // 1 xor 1 -> 0
+          // check on absent all key
+          for (int i = 0; i < numInsertions; i++) {
+            Assert.assertFalse(" filter might not contains " + i,
+                filter.membershipTest(new Key(Integer.toString(i).getBytes())));
+          }
+
+        } catch (UnsupportedOperationException ex) {
+          // not all Filter's implements this method
+          return;
+        }
+      }
+    }),
+
+    FILTER_AND_STRATEGY(new FilterTesterStrategy() {
+
+      @Override
+      public void assertWhat(Filter filter, int numInsertions, int hashId,
+          ImmutableSet<Integer> falsePositives) {
+
+        int startIntersection = numInsertions - (numInsertions - 100);
+        int endIntersection = numInsertions - 100;
+
+        Filter partialFilter = getSymmetricFilter(filter.getClass(),
+            numInsertions, hashId);
+
+        for (int i = 0; i < numInsertions; i++) {
+          String digit = Integer.toString(i);
+          filter.add(new Key(digit.getBytes()));
+          if (i >= startIntersection && i <= endIntersection) {
+            partialFilter.add(new Key(digit.getBytes()));
+          }
+        }
+
+        // do logic AND
+        filter.and(partialFilter);
+
+        for (int i = 0; i < numInsertions; i++) {
+          if (i >= startIntersection && i <= endIntersection) {
+            Assert.assertTrue(" filter might contains " + i,
+                filter.membershipTest(new Key(Integer.toString(i).getBytes())));
+          }
+        }        
+      }
+    }),
+
+    FILTER_OR_STRATEGY(new FilterTesterStrategy() {
+
+      @Override
+      public void assertWhat(Filter filter, int numInsertions, int hashId,
+          ImmutableSet<Integer> falsePositives) {
+        Filter evenFilter = getSymmetricFilter(filter.getClass(),
+            numInsertions, hashId);
+
+        // add all even
+        for (int i = 0; i < numInsertions; i += 2) {
+          evenFilter.add(new Key(Integer.toString(i).getBytes()));
+        }
+
+        // add all odd
+        for (int i = 1; i < numInsertions; i += 2) {
+          filter.add(new Key(Integer.toString(i).getBytes()));
+        }
+
+        // union odd with even
+        filter.or(evenFilter);
+
+        // check on present all key
+        for (int i = 0; i < numInsertions; i++) {
+          Assert.assertTrue(" filter might contains " + i,
+              filter.membershipTest(new Key(Integer.toString(i).getBytes())));
+        }        
+      }
+    });
+
+    private final FilterTesterStrategy testerStrategy;
+
+    BloomFilterTestStrategy(FilterTesterStrategy testerStrategy) {
+      this.testerStrategy = testerStrategy;
+    }
+
+    public FilterTesterStrategy getStrategy() {
+      return testerStrategy;
+    }
+
+  }
+
+  interface PreAssertionHelper {
+    public ImmutableSet<Integer> falsePositives(int hashId);
+  }
+
+}

Propchange: hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/bloom/BloomFilterCommonTester.java
------------------------------------------------------------------------------
    svn:eol-style = native

Added: hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/bloom/TestBloomFilters.java
URL: http://svn.apache.org/viewvc/hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/bloom/TestBloomFilters.java?rev=1528620&view=auto
==============================================================================
--- hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/bloom/TestBloomFilters.java
(added)
+++ hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/bloom/TestBloomFilters.java
Wed Oct  2 20:50:42 2013
@@ -0,0 +1,240 @@
+package org.apache.hadoop.util.bloom;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import static org.junit.Assert.assertFalse;
+import static org.junit.Assert.assertNotNull;
+import static org.junit.Assert.assertTrue;
+
+import java.util.AbstractCollection;
+import java.util.Iterator;
+
+import org.apache.hadoop.util.bloom.BloomFilterCommonTester.BloomFilterTestStrategy;
+import org.apache.hadoop.util.hash.Hash;
+import org.junit.Assert;
+import org.junit.Test;
+
+import com.google.common.collect.ImmutableList;
+import com.google.common.collect.ImmutableMap;
+import com.google.common.collect.ImmutableSet;
+
+public class TestBloomFilters {
+
+  int numInsertions = 1000;
+  int bitSize = BloomFilterCommonTester.optimalNumOfBits(numInsertions, 0.03);
+  int hashFunctionNumber = 5;
+
+  private static final ImmutableMap<Integer, ? extends AbstractCollection<Key>>
FALSE_POSITIVE_UNDER_1000 = ImmutableMap
+      .of(Hash.JENKINS_HASH, new AbstractCollection<Key>() {
+        final ImmutableList<Key> falsePositive = ImmutableList.<Key> of(
+            new Key("99".getBytes()), new Key("963".getBytes()));
+
+        @Override
+        public Iterator<Key> iterator() {
+          return falsePositive.iterator();
+        }
+
+        @Override
+        public int size() {
+          return falsePositive.size();
+        }
+      }, Hash.MURMUR_HASH, new AbstractCollection<Key>() {
+        final ImmutableList<Key> falsePositive = ImmutableList.<Key> of(
+            new Key("769".getBytes()), new Key("772".getBytes()),
+            new Key("810".getBytes()), new Key("874".getBytes()));
+
+        @Override
+        public Iterator<Key> iterator() {
+          return falsePositive.iterator();
+        }
+
+        @Override
+        public int size() {
+          return falsePositive.size();
+        }
+      });
+
+  private enum Digits {
+    ODD(1), EVEN(0);
+
+    int start;
+
+    Digits(int start) {
+      this.start = start;
+    }
+
+    int getStart() {
+      return start;
+    }
+  }
+  
+  @Test
+  public void testDynamicBloomFilter() {
+    int hashId = Hash.JENKINS_HASH;    
+    Filter filter = new DynamicBloomFilter(bitSize, hashFunctionNumber,
+        Hash.JENKINS_HASH, 3);    
+    BloomFilterCommonTester.of(hashId, numInsertions)
+        .withFilterInstance(filter)
+        .withTestCases(ImmutableSet.of(BloomFilterTestStrategy.KEY_TEST_STRATEGY,
+                BloomFilterTestStrategy.ADD_KEYS_STRATEGY,
+                BloomFilterTestStrategy.EXCEPTIONS_CHECK_STRATEGY,
+                BloomFilterTestStrategy.WRITE_READ_STRATEGY,
+                BloomFilterTestStrategy.ODD_EVEN_ABSENT_STRATEGY))
+                .test();
+    
+    assertNotNull("testDynamicBloomFilter error ", filter.toString());
+  }
+
+  @Test
+  public void testCountingBloomFilter() {
+    int hashId = Hash.JENKINS_HASH;
+
+    CountingBloomFilter filter = new CountingBloomFilter(bitSize,
+        hashFunctionNumber, hashId);
+
+    Key key = new Key(new byte[] { 48, 48 });
+
+    filter.add(key);
+    assertTrue("CountingBloomFilter.membership error ",
+        filter.membershipTest(key));
+    assertTrue("CountingBloomFilter.approximateCount error",
+        filter.approximateCount(key) == 1);
+
+    filter.add(key);
+    assertTrue("CountingBloomFilter.approximateCount error",
+        filter.approximateCount(key) == 2);
+
+    filter.delete(key);
+    assertTrue("CountingBloomFilter.membership error ",
+        filter.membershipTest(key));
+
+    filter.delete(key);
+    assertFalse("CountingBloomFilter.membership error ",
+        filter.membershipTest(key));
+    assertTrue("CountingBloomFilter.approximateCount error",
+        filter.approximateCount(key) == 0);
+
+    BloomFilterCommonTester.of(hashId, numInsertions)
+        .withFilterInstance(filter)
+        .withTestCases(ImmutableSet.of(BloomFilterTestStrategy.KEY_TEST_STRATEGY,
+                BloomFilterTestStrategy.ADD_KEYS_STRATEGY,
+                BloomFilterTestStrategy.EXCEPTIONS_CHECK_STRATEGY,
+                BloomFilterTestStrategy.ODD_EVEN_ABSENT_STRATEGY,
+                BloomFilterTestStrategy.WRITE_READ_STRATEGY,
+                BloomFilterTestStrategy.FILTER_OR_STRATEGY,
+                BloomFilterTestStrategy.FILTER_XOR_STRATEGY)).test();
+  }
+
+  @Test
+  public void testRetouchedBloomFilterSpecific() {
+    int numInsertions = 1000;
+    int hashFunctionNumber = 5;
+
+    ImmutableSet<Integer> hashes = ImmutableSet.of(Hash.MURMUR_HASH,
+        Hash.JENKINS_HASH);
+
+    for (Integer hashId : hashes) {      
+      RetouchedBloomFilter filter = new RetouchedBloomFilter(bitSize,
+          hashFunctionNumber, hashId);
+
+      checkOnAbsentFalsePositive(hashId, numInsertions, filter, Digits.ODD,
+          RemoveScheme.MAXIMUM_FP);
+      filter.and(new RetouchedBloomFilter(bitSize, hashFunctionNumber, hashId));
+
+      checkOnAbsentFalsePositive(hashId, numInsertions, filter, Digits.EVEN,
+          RemoveScheme.MAXIMUM_FP);
+      filter.and(new RetouchedBloomFilter(bitSize, hashFunctionNumber, hashId));
+
+      checkOnAbsentFalsePositive(hashId, numInsertions, filter, Digits.ODD,
+          RemoveScheme.MINIMUM_FN);
+      filter.and(new RetouchedBloomFilter(bitSize, hashFunctionNumber, hashId));
+
+      checkOnAbsentFalsePositive(hashId, numInsertions, filter, Digits.EVEN,
+          RemoveScheme.MINIMUM_FN);
+      filter.and(new RetouchedBloomFilter(bitSize, hashFunctionNumber, hashId));
+
+      checkOnAbsentFalsePositive(hashId, numInsertions, filter, Digits.ODD,
+          RemoveScheme.RATIO);
+      filter.and(new RetouchedBloomFilter(bitSize, hashFunctionNumber, hashId));
+
+      checkOnAbsentFalsePositive(hashId, numInsertions, filter, Digits.EVEN,
+          RemoveScheme.RATIO);
+      filter.and(new RetouchedBloomFilter(bitSize, hashFunctionNumber, hashId));
+    }
+  }
+
+  private void checkOnAbsentFalsePositive(int hashId, int numInsertions,
+      final RetouchedBloomFilter filter, Digits digits, short removeSchema) {
+    AbstractCollection<Key> falsePositives = FALSE_POSITIVE_UNDER_1000
+        .get(hashId);
+
+    if (falsePositives == null)
+      Assert.fail(String.format("false positives for hash %d not founded",
+          hashId));
+
+    filter.addFalsePositive(falsePositives);
+
+    for (int i = digits.getStart(); i < numInsertions; i += 2) {
+      filter.add(new Key(Integer.toString(i).getBytes()));
+    }
+
+    for (Key key : falsePositives) {
+      filter.selectiveClearing(key, removeSchema);
+    }
+
+    for (int i = 1 - digits.getStart(); i < numInsertions; i += 2) {
+      assertFalse(" testRetouchedBloomFilterAddFalsePositive error " + i,
+          filter.membershipTest(new Key(Integer.toString(i).getBytes())));
+    }
+  }
+
+  @Test
+  public void testFiltersWithJenkinsHash() {
+    int hashId = Hash.JENKINS_HASH;
+
+    BloomFilterCommonTester.of(hashId, numInsertions)
+        .withFilterInstance(new BloomFilter(bitSize, hashFunctionNumber, hashId))
+        .withFilterInstance(new RetouchedBloomFilter(bitSize, hashFunctionNumber, hashId))
+        .withTestCases(ImmutableSet.of(BloomFilterTestStrategy.KEY_TEST_STRATEGY,
+                BloomFilterTestStrategy.ADD_KEYS_STRATEGY,
+                BloomFilterTestStrategy.EXCEPTIONS_CHECK_STRATEGY,
+                BloomFilterTestStrategy.ODD_EVEN_ABSENT_STRATEGY,
+                BloomFilterTestStrategy.WRITE_READ_STRATEGY,
+                BloomFilterTestStrategy.FILTER_OR_STRATEGY,
+                BloomFilterTestStrategy.FILTER_AND_STRATEGY,
+                BloomFilterTestStrategy.FILTER_XOR_STRATEGY)).test();
+  }
+
+  @Test
+  public void testFiltersWithMurmurHash() {
+    int hashId = Hash.MURMUR_HASH;
+
+    BloomFilterCommonTester.of(hashId, numInsertions)
+        .withFilterInstance(new BloomFilter(bitSize, hashFunctionNumber, hashId))
+        .withFilterInstance(new RetouchedBloomFilter(bitSize, hashFunctionNumber, hashId))
+        .withTestCases(ImmutableSet.of(BloomFilterTestStrategy.KEY_TEST_STRATEGY,
+                BloomFilterTestStrategy.ADD_KEYS_STRATEGY,
+                BloomFilterTestStrategy.EXCEPTIONS_CHECK_STRATEGY,
+                BloomFilterTestStrategy.ODD_EVEN_ABSENT_STRATEGY,
+                BloomFilterTestStrategy.WRITE_READ_STRATEGY,
+                BloomFilterTestStrategy.FILTER_OR_STRATEGY,
+                BloomFilterTestStrategy.FILTER_AND_STRATEGY,
+                BloomFilterTestStrategy.FILTER_XOR_STRATEGY)).test();
+  }
+}

Propchange: hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/bloom/TestBloomFilters.java
------------------------------------------------------------------------------
    svn:eol-style = native

Added: hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/hash/TestHash.java
URL: http://svn.apache.org/viewvc/hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/hash/TestHash.java?rev=1528620&view=auto
==============================================================================
--- hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/hash/TestHash.java
(added)
+++ hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/hash/TestHash.java
Wed Oct  2 20:50:42 2013
@@ -0,0 +1,89 @@
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+package org.apache.hadoop.util.hash;
+
+import static org.junit.Assert.*;
+import org.apache.hadoop.conf.Configuration;
+import org.junit.Test;
+
+public class TestHash {
+  static final String LINE = "34563@45kjkksdf/ljfdb9d8fbusd*89uggjsk<dfgjsdfh@sddc2q3esc";
+
+  @Test
+  public void testHash() {
+    int iterations = 30;
+    assertTrue("testHash jenkins error !!!",
+        Hash.JENKINS_HASH == Hash.parseHashType("jenkins"));
+    assertTrue("testHash murmur error !!!",
+        Hash.MURMUR_HASH == Hash.parseHashType("murmur"));
+    assertTrue("testHash undefined",
+        Hash.INVALID_HASH == Hash.parseHashType("undefined"));
+
+    Configuration cfg = new Configuration();
+    cfg.set("hadoop.util.hash.type", "murmur");
+    assertTrue("testHash", MurmurHash.getInstance() == Hash.getInstance(cfg));
+
+    cfg = new Configuration();
+    cfg.set("hadoop.util.hash.type", "jenkins");
+    assertTrue("testHash jenkins configuration error !!!",
+        JenkinsHash.getInstance() == Hash.getInstance(cfg));
+
+    cfg = new Configuration();
+    assertTrue("testHash undefine configuration error !!!",
+        MurmurHash.getInstance() == Hash.getInstance(cfg));
+
+    assertTrue("testHash error jenkin getInstance !!!",
+        JenkinsHash.getInstance() == Hash.getInstance(Hash.JENKINS_HASH));
+    assertTrue("testHash error murmur getInstance !!!",
+        MurmurHash.getInstance() == Hash.getInstance(Hash.MURMUR_HASH));
+
+    assertNull("testHash error invalid getInstance !!!",
+        Hash.getInstance(Hash.INVALID_HASH));
+
+    int murmurHash = Hash.getInstance(Hash.MURMUR_HASH).hash(LINE.getBytes());
+    for (int i = 0; i < iterations; i++) {
+      assertTrue("multiple evaluation murmur hash error !!!",
+          murmurHash == Hash.getInstance(Hash.MURMUR_HASH)
+              .hash(LINE.getBytes()));
+    }
+
+    murmurHash = Hash.getInstance(Hash.MURMUR_HASH).hash(LINE.getBytes(), 67);
+    for (int i = 0; i < iterations; i++) {
+      assertTrue(
+          "multiple evaluation murmur hash error !!!",
+          murmurHash == Hash.getInstance(Hash.MURMUR_HASH).hash(
+              LINE.getBytes(), 67));
+    }
+
+    int jenkinsHash = Hash.getInstance(Hash.JENKINS_HASH).hash(LINE.getBytes());
+    for (int i = 0; i < iterations; i++) {
+      assertTrue(
+          "multiple evaluation jenkins hash error !!!",
+          jenkinsHash == Hash.getInstance(Hash.JENKINS_HASH).hash(
+              LINE.getBytes()));
+    }
+
+    jenkinsHash = Hash.getInstance(Hash.JENKINS_HASH).hash(LINE.getBytes(), 67);
+    for (int i = 0; i < iterations; i++) {
+      assertTrue(
+          "multiple evaluation jenkins hash error !!!",
+          jenkinsHash == Hash.getInstance(Hash.JENKINS_HASH).hash(
+              LINE.getBytes(), 67));
+    }   
+  } 
+}

Propchange: hadoop/common/trunk/hadoop-common-project/hadoop-common/src/test/java/org/apache/hadoop/util/hash/TestHash.java
------------------------------------------------------------------------------
    svn:eol-style = native



Mime
View raw message