adding an XOR/Fuse benchmark

lemire · lemire · commit a808079b7524 · 2026-01-06T09:51:18.000-05:00
diff --git a/README.md b/README.md
@@ -87,5 +87,72 @@ and with less than 1% probability "Found" or "Found; common".
 
 Internally, the tool uses a xor+ filter (see above) with 8 bits per fingerprint. Actually, 1024 smaller filters (segments) are made, the segment id being the highest 10 bits of the key. The lowest bit of the key is set to either 0 (regular) or 1 (common), and so two lookups are made per password. Because of that, the false positive rate is twice of what it would be with just one lookup (0.0078 instead of 0.0039). A regular Bloom filter with the same guarantees would be ~760 MB. For each lookup, one filter segment (so, less than 1 MB) are read from the file.
 
+## Benchmarks
+
+The project includes JMH (Java Microbenchmark Harness) benchmarks to measure the performance of the filters.
+
+### Running Benchmarks
+
+#### Option 1: Run via Maven (recommended)
+
+To run the benchmarks directly from Maven (with minimal iterations for quick testing):
+
+    mvn -pl jmh clean package exec:exec@run-benchmarks
+
+For full benchmarks, modify the pom.xml or run the JAR manually with custom parameters.
+
+The Maven command above compiles and runs the JMH benchmarks for all four XOR filter types (XOR_8, XOR_16, XOR_BINARY_FUSE_8, XOR_BINARY_FUSE_16).
+
+#### Option 2: Run the JAR manually
+
+First, build the project:
+
+    mvn clean package
+
+Then run the benchmarks:
+
+    java -jar jmh/target/benchmarks.jar org.fastfilter.FilterBenchmark
+
+To run benchmarks for a specific filter type:
+
+    java -jar jmh/target/benchmarks.jar org.fastfilter.FilterBenchmark -p filterType=XOR_BINARY_FUSE_8
+
+Available filter types: `XOR_8`, `XOR_16`, `XOR_BINARY_FUSE_8`, `XOR_BINARY_FUSE_16`.
+
+### Benchmark Details
+
+The benchmarks measure:
+- Average time per operation (nanoseconds) for lookups of existing and non-existing keys
+- Throughput (operations per second) for the same operations
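+- False positive rate validation (the non-existing-key benchmarks fail if more than 10,000 of the 1,000,000 lookups, i.e. 1%, are false positives)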
+
+
+Example results (in this output, the comma is the decimal separator):
+
+```
+
+Benchmark                                                     (filterType)   Mode  Cnt          Score   Error  Units
+FilterBenchmark.benchmarkContainsExistingThroughput                  XOR_8  thrpt       412364492,755          ops/s
+FilterBenchmark.benchmarkContainsExistingThroughput                 XOR_16  thrpt       397627818,837          ops/s
+FilterBenchmark.benchmarkContainsExistingThroughput      XOR_BINARY_FUSE_8  thrpt       516262004,459          ops/s
+FilterBenchmark.benchmarkContainsExistingThroughput     XOR_BINARY_FUSE_16  thrpt       489256453,340          ops/s
+FilterBenchmark.benchmarkContainsNonExistingThroughput               XOR_8  thrpt       429856367,135          ops/s
+FilterBenchmark.benchmarkContainsNonExistingThroughput              XOR_16  thrpt       441042890,257          ops/s
+FilterBenchmark.benchmarkContainsNonExistingThroughput   XOR_BINARY_FUSE_8  thrpt       533609392,046          ops/s
+FilterBenchmark.benchmarkContainsNonExistingThroughput  XOR_BINARY_FUSE_16  thrpt       540058414,150          ops/s
+FilterBenchmark.benchmarkContainsExisting                            XOR_8   avgt               2,475          ns/op
+FilterBenchmark.benchmarkContainsExisting                           XOR_16   avgt               2,522          ns/op
+FilterBenchmark.benchmarkContainsExisting                XOR_BINARY_FUSE_8   avgt               1,965          ns/op
+FilterBenchmark.benchmarkContainsExisting               XOR_BINARY_FUSE_16   avgt               2,060          ns/op
+FilterBenchmark.benchmarkContainsNonExisting                         XOR_8   avgt               2,347          ns/op
+FilterBenchmark.benchmarkContainsNonExisting                        XOR_16   avgt               2,295          ns/op
+FilterBenchmark.benchmarkContainsNonExisting             XOR_BINARY_FUSE_8   avgt               1,892          ns/op
+FilterBenchmark.benchmarkContainsNonExisting            XOR_BINARY_FUSE_16   avgt               1,903          ns/op
+```
+
+This indicates that we can issue about half a billion queries per second, or equivalently about 2 ns per query.
+
+The benchmarks use 1,000,000 keys by default. You can modify the `NUM_KEYS` constant in `FilterBenchmark.java` for smaller/larger test sets.
+
 
 
diff --git a/jmh/pom.xml b/jmh/pom.xml
@@ -39,6 +39,13 @@
                     <fork>true</fork>
                     <source>${maven.compiler.source}</source>
                     <target>${maven.compiler.target}</target>
+                    <annotationProcessorPaths> <!-- registers jmh-generator-annprocess as an annotation processor for this compilation -->
+                        <path>
+                            <groupId>org.openjdk.jmh</groupId>
+                            <artifactId>jmh-generator-annprocess</artifactId>
+                            <version>${jmh.version}</version>
+                        </path>
+                    </annotationProcessorPaths>
                     <showDeprecation>true</showDeprecation>
                     <failOnError>true</failOnError>
                     <showWarnings>true</showWarnings>
@@ -67,6 +74,34 @@
                     </execution>
                 </executions>
             </plugin>
+
+            <plugin> <!-- quick benchmark run, invoked with: mvn -pl jmh clean package exec:exec@run-benchmarks -->
+                <groupId>org.codehaus.mojo</groupId>
+                <artifactId>exec-maven-plugin</artifactId>
+                <version>3.1.0</version>
+                <executions>
+                    <execution>
+                        <id>run-benchmarks</id>
+                        <goals>
+                            <goal>exec</goal>
+                        </goals>
+                        <configuration>
+                            <executable>java</executable>
+                            <arguments>
+                                <argument>-jar</argument>
+                                <argument>${project.build.directory}/benchmarks.jar</argument>
+                                <argument>org.fastfilter.FilterBenchmark</argument> <!-- which benchmarks to run -->
+                                <argument>-f</argument> <!-- -f 1: a single forked JVM -->
+                                <argument>1</argument>
+                                <argument>-wi</argument> <!-- -wi 1: a single warmup iteration -->
+                                <argument>1</argument>
+                                <argument>-i</argument> <!-- -i 1: a single measurement iteration -->
+                                <argument>1</argument>
+                            </arguments>
+                        </configuration>
+                    </execution>
+                </executions>
+            </plugin>
         </plugins>
     </build>
 
diff --git a/jmh/src/main/java/org/fastfilter/FilterBenchmark.java b/jmh/src/main/java/org/fastfilter/FilterBenchmark.java
@@ -0,0 +1,130 @@
+package org.fastfilter;
+
+import org.openjdk.jmh.annotations.*;
+import org.openjdk.jmh.infra.Blackhole;
+import org.openjdk.jmh.runner.Runner;
+import org.openjdk.jmh.runner.RunnerException;
+import org.openjdk.jmh.runner.options.Options;
+import org.openjdk.jmh.runner.options.OptionsBuilder;
+
+import org.fastfilter.Filter;
+import org.fastfilter.xor.Xor8;
+import org.fastfilter.xor.Xor16;
+import org.fastfilter.xor.XorBinaryFuse8;
+import org.fastfilter.xor.XorBinaryFuse16;
+
+import java.util.concurrent.TimeUnit;
+
+/**
+ * JMH benchmark of {@code mayContain} lookups on the XOR and binary fuse filters. The filter
+ * holds the even numbers below {@code 2 * NUM_KEYS}; odd numbers serve as absent keys. Lookup
+ * results feed validity checks, so the {@code Blackhole} parameters are not needed and are
+ * kept only so the benchmark method signatures stay unchanged.
+ */
+@BenchmarkMode(Mode.AverageTime)
+@OutputTimeUnit(TimeUnit.NANOSECONDS)
+@Warmup(iterations = 3, time = 1, timeUnit = TimeUnit.SECONDS)
+@Measurement(iterations = 5, time = 1, timeUnit = TimeUnit.SECONDS)
+@Fork(1)
+@State(Scope.Benchmark)
+public class FilterBenchmark {
+
+    /** Number of keys in the filter, and number of lookups per benchmark invocation. */
+    private static final int NUM_KEYS = 1_000_000;
+
+    /** False positives tolerated per invocation: 1% of the lookups, scaling with NUM_KEYS. */
+    private static final int MAX_FALSE_POSITIVES = NUM_KEYS / 100;
+
+    @Param({"XOR_8", "XOR_16", "XOR_BINARY_FUSE_8", "XOR_BINARY_FUSE_16"})
+    public String filterType;
+
+    private Filter filter;
+    private long[] testKeys;
+
+    /** Builds the keys and the filter named by filterType; unknown names are rejected. */
+    @Setup
+    public void setup() {
+        testKeys = new long[NUM_KEYS];
+        for (int i = 0; i < testKeys.length; i++) {
+            testKeys[i] = 2L * i; // even numbers only
+        }
+        switch (filterType) {
+            case "XOR_8":
+                filter = Xor8.construct(testKeys);
+                break;
+            case "XOR_16":
+                filter = Xor16.construct(testKeys);
+                break;
+            case "XOR_BINARY_FUSE_8":
+                filter = XorBinaryFuse8.construct(testKeys);
+                break;
+            case "XOR_BINARY_FUSE_16":
+                filter = XorBinaryFuse16.construct(testKeys);
+                break;
+            default:
+                throw new IllegalArgumentException("Unknown filter type: " + filterType);
+        }
+    }
+
+    @TearDown // drops the references to the filter and the key array
+    public void tearDown() {
+        filter = null;
+        testKeys = null;
+    }
+
+    @Benchmark // average time per lookup, keys that were inserted
+    @OperationsPerInvocation(NUM_KEYS)
+    public void benchmarkContainsExisting(Blackhole blackhole) {
+        probeInsertedKeys();
+    }
+
+    @Benchmark // average time per lookup, keys that were never inserted
+    @OperationsPerInvocation(NUM_KEYS)
+    public void benchmarkContainsNonExisting(Blackhole blackhole) {
+        probeAbsentKeys();
+    }
+
+    @Benchmark // lookups per second, keys that were inserted
+    @BenchmarkMode(Mode.Throughput)
+    @OutputTimeUnit(TimeUnit.SECONDS)
+    @OperationsPerInvocation(NUM_KEYS)
+    public void benchmarkContainsExistingThroughput(Blackhole blackhole) {
+        probeInsertedKeys();
+    }
+
+    @Benchmark // lookups per second, keys that were never inserted
+    @BenchmarkMode(Mode.Throughput)
+    @OutputTimeUnit(TimeUnit.SECONDS)
+    @OperationsPerInvocation(NUM_KEYS)
+    public void benchmarkContainsNonExistingThroughput(Blackhole blackhole) {
+        probeAbsentKeys();
+    }
+
+    /** Looks up every inserted key; throws if the filter denies one (a false negative). */
+    private void probeInsertedKeys() {
+        for (long key : testKeys) {
+            if (!filter.mayContain(key)) {
+                throw new IllegalStateException("Key should exist: " + key);
+            }
+        }
+    }
+
+    /** Looks up one odd key per inserted key; throws if more than 1% are false positives. */
+    private void probeAbsentKeys() {
+        int falsePositives = 0;
+        for (int i = 0; i < testKeys.length; i++) {
+            if (filter.mayContain(2L * i + 1L)) { // odd numbers were never inserted
+                falsePositives++;
+            }
+        }
+        if (falsePositives > MAX_FALSE_POSITIVES) {
+            throw new IllegalStateException("Too many false positives: " + falsePositives);
+        }
+    }
+
+    /** Runs all benchmarks of this class using the settings from the annotations. */
+    public static void main(String[] args) throws RunnerException {
+        Options opt = new OptionsBuilder().include(FilterBenchmark.class.getSimpleName()).build();
+        new Runner(opt).run();
+    }
+}