/* * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY * KIND, either express or implied. See the License for the * specific language governing permissions and limitations * under the License. */ package org.apache.cassandra.utils; import java.io.ByteArrayInputStream; import java.io.DataInputStream; import java.io.IOException; import java.nio.ByteBuffer; import java.util.HashSet; import java.util.Iterator; import java.util.Set; import org.junit.Test; import org.apache.cassandra.io.util.DataOutputBuffer; import org.apache.cassandra.utils.BKeyGenerator.RandomStringGenerator; public class FilterTest { public void testManyHashes(Iterator<String> keys) { int MAX_HASH_COUNT = 128; Set<Long> hashes = new HashSet<Long>(); int collisions = 0; while (keys.hasNext()) { hashes.clear(); String key = keys.next(); long[] hashBuckets = BloomFilter.getHashBuckets(key, MAX_HASH_COUNT, 1024 * 1024); for (long hashIndex : hashBuckets) { hashes.add(hashIndex); } collisions += (MAX_HASH_COUNT - hashes.size()); if (MAX_HASH_COUNT != hashes.size()) { System.out.println(key+": collisins: "+collisions+", hashSize:"+hashes.size()+", buckets:"+hashBuckets.length); } } assert collisions <= 200; } @Test public void testManyRandom() { testManyHashes(randomKeys()); } /* public void testManyHashes(Iterator<ByteBuffer> keys) { int MAX_HASH_COUNT = 128; Set<Long> hashes = new HashSet<Long>(); int collisions = 0; while (keys.hasNext()) { hashes.clear(); ByteBuffer key = keys.next(); long[] hashBuckets = BloomFilter.getHashBuckets(key, MAX_HASH_COUNT, 1024 * 1024); for (long hashIndex : hashBuckets) { hashes.add(hashIndex); } collisions += (MAX_HASH_COUNT - hashes.size()); if (MAX_HASH_COUNT != hashes.size()) { System.out.println(key+": collisins: "+collisions+", hashSize:"+hashes.size()+", buckets:"+hashBuckets.length); } } assert collisions <= 100; } @Test public void testManyRandom() { testManyHashes(randomBKeys()); } */ // used by filter subclass tests static final double MAX_FAILURE_RATE = 0.1; public static final BloomCalculations.BloomSpecification spec = BloomCalculations.computeBloomSpec(15, MAX_FAILURE_RATE); static final int ELEMENTS = 10000; static final ResetableIterator<String> intKeys() { return new KeyGenerator.IntGenerator(ELEMENTS); } static final ResetableIterator<String> randomKeys() { return new KeyGenerator.RandomStringGenerator(314159, ELEMENTS); } static final RandomStringGenerator randomBKeys() { return new BKeyGenerator.RandomStringGenerator(314159, ELEMENTS); } static final ResetableIterator<String> randomKeys2() { return new KeyGenerator.RandomStringGenerator(271828, ELEMENTS); } public static void testFalsePositives(Filter f, ResetableIterator<String> keys, ResetableIterator<String> otherkeys) { assert keys.size() == otherkeys.size(); while (keys.hasNext()) { f.add(keys.next()); } int fp = 0; while (otherkeys.hasNext()) { if (f.isPresent(otherkeys.next())) { fp++; } } double fp_ratio = fp / (keys.size() * BloomCalculations.probs[spec.bucketsPerElement][spec.K]); assert fp_ratio < 1.03 : fp_ratio; } }