本文基於Spring Boot 2.6.6、redisson 3.16.0簡單分析Redisson布隆過濾器的使用。
<!-- Spring Boot Redis starter, with its lettuce-core dependency excluded. -->
<dependency>
    <groupId>org.springframework.boot</groupId>
    <artifactId>spring-boot-starter-data-redis</artifactId>
    <exclusions>
        <exclusion>
            <groupId>io.lettuce</groupId>
            <artifactId>lettuce-core</artifactId>
        </exclusion>
    </exclusions>
</dependency>
<!-- Jedis client. No version element is declared here; presumably it is managed by a parent POM/BOM (confirm). -->
<dependency>
    <groupId>redis.clients</groupId>
    <artifactId>jedis</artifactId>
</dependency>
<!-- Redisson, pinned to version 3.16.0. -->
<dependency>
    <groupId>org.redisson</groupId>
    <artifactId>redisson</artifactId>
    <version>3.16.0</version>
</dependency>
public class BloomFilterDemo { public static void main(String[] args) { Config config = new Config(); config.useSingleServer().setAddress("redis://"); RedissonClient redissonClient = Redisson.create(config); RBloomFilter<String> bloomFilter = redissonClient.getBloomFilter("bloom-filter"); // 初始化布隆過濾器 bloomFilter.tryInit(200, 0.01); List<String> elements = new ArrayList<>(); for (int i = 0; i < 200; i++) { elements.add(UUID.randomUUID().toString()); } // 向布隆過濾器中新增內容 init(bloomFilter, elements); // 測試檢索效果 test(bloomFilter, elements); redissonClient.shutdown(); } public static void init(RBloomFilter<String> bloomFilter, List<String> elements) { for (int i = 0; i < elements.size(); i++) { if (i % 2 == 0) { bloomFilter.add(elements.get(i)); } } } public static void test(RBloomFilter<String> bloomFilter, List<String> elements) { int counter = 0; for (String element : elements) { if (bloomFilter.contains(element)) { counter++; } } System.out.println(counter); } }
public boolean tryInit(long expectedInsertions, double falseProbability) { if (falseProbability > 1) { throw new IllegalArgumentException("Bloom filter false probability can't be greater than 1"); } if (falseProbability < 0) { throw new IllegalArgumentException("Bloom filter false probability can't be negative"); } // 根據元素個數和錯誤率計算得到向量長度 size = optimalNumOfBits(expectedInsertions, falseProbability); if (size == 0) { throw new IllegalArgumentException("Bloom filter calculated size is " + size); } if (size > getMaxSize()) { throw new IllegalArgumentException("Bloom filter size can't be greater than " + getMaxSize() + ". But calculated size is " + size); } // 根據元素個數和向量長度計算得到雜湊函數的個數 hashIterations = optimalNumOfHashFunctions(expectedInsertions, size); CommandBatchService executorService = new CommandBatchService(commandExecutor); executorService.evalReadAsync(configName, codec, RedisCommands.EVAL_VOID, "local size = redis.call('hget', KEYS[1], 'size');" + "local hashIterations = redis.call('hget', KEYS[1], 'hashIterations');" + "assert(size == false and hashIterations == false, 'Bloom filter config has been changed')", Arrays.<Object>asList(configName), size, hashIterations); executorService.writeAsync(configName, StringCodec.INSTANCE, new RedisCommand<Void>("HMSET", new VoidReplayConvertor()), configName, "size", size, "hashIterations", hashIterations, "expectedInsertions", expectedInsertions, "falseProbability", BigDecimal.valueOf(falseProbability).toPlainString()); try { executorService.execute(); } catch (RedisException e) { if (e.getMessage() == null || !e.getMessage().contains("Bloom filter config has been changed")) { throw e; } readConfig(); return false; } return true; } private long optimalNumOfBits(long n, double p) { if (p == 0) { p = Double.MIN_VALUE; } return (long) (-n * Math.log(p) / (Math.log(2) * Math.log(2))); } private int optimalNumOfHashFunctions(long n, long m) { return Math.max(1, (int) Math.round((double) m / n * Math.log(2))); }
public boolean add(T object) { // 根據帶插入元素得到兩個long型別雜湊值 long[] hashes = hash(object); while (true) { if (size == 0) { readConfig(); } int hashIterations = this.hashIterations; long size = this.size; // 得到位下標陣列 // 以兩個雜湊值根據指定策略生成hashIterations個雜湊值,從而得到位下標 long[] indexes = hash(hashes[0], hashes[1], hashIterations, size); CommandBatchService executorService = new CommandBatchService(commandExecutor); addConfigCheck(hashIterations, size, executorService); RBitSetAsync bs = createBitSet(executorService); for (int i = 0; i < indexes.length; i++) { // 將位下標對應位設定1 bs.setAsync(indexes[i]); } try { List<Boolean> result = (List<Boolean>) executorService.execute().getResponses(); for (Boolean val : result.subList(1, result.size()-1)) { if (!val) { // 元素新增成功 return true; } } // 元素已存在 return false; } catch (RedisException e) { if (e.getMessage() == null || !e.getMessage().contains("Bloom filter config has been changed")) { throw e; } } } } private long[] hash(Object object) { ByteBuf state = encode(object); try { return Hash.hash128(state); } finally { state.release(); } } private long[] hash(long hash1, long hash2, int iterations, long size) { long[] indexes = new long[iterations]; long hash = hash1; for (int i = 0; i < iterations; i++) { indexes[i] = (hash & Long.MAX_VALUE) % size; // 雜湊函數的實現方式 if (i % 2 == 0) { // 新雜湊值 hash += hash2; } else { // 新雜湊值 hash += hash1; } } return indexes; }
public boolean contains(T object) { // 根據帶插入元素得到兩個long型別雜湊值 long[] hashes = hash(object); while (true) { if (size == 0) { readConfig(); } int hashIterations = this.hashIterations; long size = this.size; // 得到位下標陣列 // 以兩個雜湊值根據指定策略生成hashIterations個雜湊值,從而得到位下標 long[] indexes = hash(hashes[0], hashes[1], hashIterations, size); CommandBatchService executorService = new CommandBatchService(commandExecutor); addConfigCheck(hashIterations, size, executorService); RBitSetAsync bs = createBitSet(executorService); for (int i = 0; i < indexes.length; i++) { // 獲取位下標對應位的值 bs.getAsync(indexes[i]); } try { List<Boolean> result = (List<Boolean>) executorService.execute().getResponses(); for (Boolean val : result.subList(1, result.size()-1)) { if (!val) { // 若存在不為1的位,則認為元素不存在 return false; } } // 都為1,則認為元素存在 return true; } catch (RedisException e) { if (e.getMessage() == null || !e.getMessage().contains("Bloom filter config has been changed")) { throw e; } } } }
