diff --git a/.github/workflows/bench.yml b/.github/workflows/bench.yml index c7ce09f..f3002de 100644 --- a/.github/workflows/bench.yml +++ b/.github/workflows/bench.yml @@ -15,18 +15,30 @@ jobs: - uses: actions/checkout@v4 - name: Benchmark - run: cargo bench --bench throughput --features 'bench-plot' + run: cargo bench --bench throughput --features bench-plot + + - uses: actions/upload-artifact@v3 + with: + name: benches + path: benches/throughput/x86_64.svg + + benchmark-x86-avx2: + name: Benchmark X86 AVX2 + runs-on: buildjet-2vcpu-ubuntu-2204 + + steps: + - uses: actions/checkout@v4 - name: Switch to nightly rust run: rustup default nightly - - name: Benchmark AVX2 (nightly) - run: cargo bench --bench throughput --features 'bench-plot avx2' + - name: Benchmark + run: cargo bench --bench throughput --features bench-plot - uses: actions/upload-artifact@v3 with: name: benches - path: benches/throughput/*.svg + path: benches/throughput/x86_64-hybrid.svg benchmark-arm: name: Benchmark ARM @@ -36,17 +48,17 @@ jobs: - uses: actions/checkout@v4 - name: Benchmark - run: cargo bench --bench throughput --features 'bench-plot' + run: cargo bench --bench throughput --features bench-plot - uses: actions/upload-artifact@v3 with: name: benches - path: benches/throughput/*.svg + path: benches/throughput/aarch64.svg commit: name: Commit & Push runs-on: buildjet-2vcpu-ubuntu-2204 - needs: [benchmark-x86, benchmark-arm] + needs: [benchmark-x86, benchmark-x86-avx2, benchmark-arm] permissions: contents: write diff --git a/.github/workflows/build_test.yml b/.github/workflows/build_test.yml index a178298..45e04cf 100644 --- a/.github/workflows/build_test.yml +++ b/.github/workflows/build_test.yml @@ -10,14 +10,44 @@ env: CARGO_TERM_COLOR: always jobs: - build_test: + build_test_x86: + name: Build & Test X86 + runs-on: ubuntu-latest + + steps: + - uses: actions/checkout@v3 - name: Build & Test + - name: Build + run: cargo build --release + + - name: Test + run: cargo test --release + + build_test_x86_avx2: + name: Build & Test X86 AVX2 runs-on: ubuntu-latest steps: - uses: actions/checkout@v3 + + - name: Switch to nightly rust + run: rustup default nightly + - name: Build run: cargo build --release + + - name: Test + run: cargo test --release + + build_test_arm: + name: Build & Test ARM + runs-on: buildjet-2vcpu-ubuntu-2204-arm + + steps: + - uses: actions/checkout@v3 + + - name: Build + run: cargo build --release + - name: Test run: cargo test --release \ No newline at end of file diff --git a/Cargo.toml b/Cargo.toml index 42ce8c3..289de9c 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -1,7 +1,7 @@ [package] name = "gxhash" authors = ["Olivier Giniaux"] -version = "2.3.0" +version = "3.0.0" edition = "2021" description = "GxHash non-cryptographic algorithm" license = "MIT" @@ -13,10 +13,6 @@ categories = ["algorithms", "data-structures", "no-std"] exclude = ["article/*"] [features] -# The 256-bit state GxHash is faster for large inputs than the default 128-bit state implementation, but faster on smaller hashes. -# Please not however that the 256-bit GxHash and the 128-bit GxHash don't generate the same hashes for a same input. -# Requires AVX2 and VAES (X86). 
-avx2 = [] # Only relevant for throughput benchmarks bench-csv = [] bench-md = [] @@ -39,6 +35,9 @@ seahash = "4.1.0" metrohash = "1.0.6" fnv = "1.0.3" +[build-dependencies] +rustc_version = "0.4.0" + [dev-dependencies.plotters] version = "0.3.5" default-features = false diff --git a/README.md b/README.md index a18522d..eac8029 100644 --- a/README.md +++ b/README.md @@ -44,7 +44,7 @@ GxHash is compatible with: > Other platforms are currently not supported (there is no fallback). The behavior on these platforms is undefined. ### Hashes Stability -All generated hashes for a given version of GxHash are stable, meaning that for a given input the output hash will be the same across all supported platforms. An exception to this is the AVX2 version of GxHash (nightly). +All generated hashes for a given version of GxHash are stable, meaning that for a given input the output hash will be the same across all supported platforms. ## Benchmarks @@ -74,7 +74,7 @@ GxHash is continuously benchmarked on X86 and ARM Github runners. GxHash is a seeded hashing algorithm, meaning that depending on the seed used, it will generate completely different hashes. The default `HasherBuilder` (`GxHasherBuilder::default()`) uses seed randomization, making any `HashMap`/`HashSet` more DOS resistant, as it will make it much more difficult for attackers to be able to predict which hashes may collide without knowing the seed used. This does not mean however that it is completely DOS resistant. This has to be analyzed further. ### Multicollisions Resistance -GxHash uses a 128-bit internal state (and even 256-bit with the `avx2` feature). This makes GxHash [a widepipe construction](https://en.wikipedia.org/wiki/Merkle%E2%80%93Damg%C3%A5rd_construction#Wide_pipe_construction) when generating hashes of size 64-bit or smaller, which had amongst other properties to be inherently more resistant to multicollision attacks. See [this paper](https://www.iacr.org/archive/crypto2004/31520306/multicollisions.pdf) for more details. +GxHash uses a 128-bit internal state. This makes GxHash [a widepipe construction](https://en.wikipedia.org/wiki/Merkle%E2%80%93Damg%C3%A5rd_construction#Wide_pipe_construction) when generating hashes of size 64-bit or smaller, which had amongst other properties to be inherently more resistant to multicollision attacks. See [this paper](https://www.iacr.org/archive/crypto2004/31520306/multicollisions.pdf) for more details. ### Cryptographic Properties GxHash is a non-cryptographic hashing algorithm, thus it is not recommended to use it as a cryptographic algorithm (it is not a replacement for SHA). It has not been assessed if GxHash is preimage resistant and how difficult it is to be reversed. 
@@ -103,4 +103,4 @@ Publication: [PDF](https://github.com/ogxd/gxhash-rust/blob/main/article/article.pdf) Cite this publication / algorithm: -[![DOI](https://zenodo.org/badge/690754256.svg)](https://zenodo.org/badge/latestdoi/690754256) +[![DOI](https://zenodo.org/badge/690754256.svg)](https://zenodo.org/badge/latestdoi/690754256) \ No newline at end of file diff --git a/benches/throughput/aarch64.svg b/benches/throughput/aarch64.svg index 63c9d27..541e304 100644 --- a/benches/throughput/aarch64.svg +++ b/benches/throughput/aarch64.svg @@ -4,12 +4,13 @@ Throughput (aarch64) - - - - - - + + + + + + + Throughput (MiB/s) @@ -31,41 +32,46 @@ Input Size (bytes) - - - - - - + + + + + + + 0 - + 5000 - - + + 10000 - - + + 15000 - - + + 20000 - - + + 25000 - - + + 30000 - + + +35000 + + 4 @@ -123,14 +129,14 @@ Input Size (bytes) 32768 - - - - - - - - + + + + + + + + diff --git a/benches/throughput/main.rs b/benches/throughput/main.rs index 3b78fa7..3a48963 100644 --- a/benches/throughput/main.rs +++ b/benches/throughput/main.rs @@ -38,7 +38,7 @@ fn main() { }; // GxHash - let gxhash_name = if cfg!(feature = "avx2") { "gxhash-avx2" } else { "gxhash" }; + let gxhash_name = if cfg!(hybrid) { "gxhash-hybrid" } else { "gxhash" }; benchmark(processor.as_mut(), slice, gxhash_name, |data: &[u8], seed: i64| -> u64 { gxhash64(data, seed) }); diff --git a/benches/throughput/result_processor.rs b/benches/throughput/result_processor.rs index 49bece6..2b15546 100644 --- a/benches/throughput/result_processor.rs +++ b/benches/throughput/result_processor.rs @@ -120,8 +120,8 @@ impl ResultProcessor for OutputPlot { fn finish(&self) { let mut arch = std::env::consts::ARCH.to_string(); - if cfg!(feature = "avx2") { - arch += "-avx2"; + if cfg!(hybrid) { + arch += "-hybrid"; } let file_name = format!("benches/throughput/{}.svg", arch); @@ -176,6 +176,6 @@ impl ResultProcessor for OutputPlot { // To avoid the IO failure being ignored silently, we manually call the present function canvas.present().expect("Unable to write result to file, please make sure 'plotters-doc-data' dir exists under current dir"); - println!("Finished"); + println!("Finished: '{}'", file_name); } } \ No newline at end of file diff --git a/benches/throughput/x86_64-avx2.svg b/benches/throughput/x86_64-hybrid.svg similarity index 72% rename from benches/throughput/x86_64-avx2.svg rename to benches/throughput/x86_64-hybrid.svg index 3e769ce..918f5c7 100644 --- a/benches/throughput/x86_64-avx2.svg +++ b/benches/throughput/x86_64-hybrid.svg @@ -1,17 +1,16 @@ -Throughput (x86_64-avx2) +Throughput (x86_64-hybrid) - - - - - - - - + + + + + + + Throughput (MiB/s) @@ -33,51 +32,46 @@ Input Size (bytes) - - - - - - - - + + + + + + + 0 - + 20000 - - + + 40000 - - + + 60000 - - + + 80000 - - + + 100000 - - + + 120000 - - + + 140000 - - -160000 - - + 4 @@ -135,46 +129,46 @@ Input Size (bytes) 32768 - - - - - - - - - - - -gxhash-avx2 - - + + + + + + + + + + + +gxhash-hybrid + + xxhash - + ahash - + t1ha0 - + seahash - + metrohash - + highwayhash - + fnv-1a - - - - - - - - + + + + + + + + diff --git a/benches/throughput/x86_64.svg b/benches/throughput/x86_64.svg index 16a5047..0a34d6c 100644 --- a/benches/throughput/x86_64.svg +++ b/benches/throughput/x86_64.svg @@ -4,16 +4,11 @@ Throughput (x86_64) - - - - - - - - - - + + + + + Throughput (MiB/s) @@ -35,61 +30,36 @@ Input Size (bytes) - - - - - - - - - - + + + + + 0 - -10000 - - - + 20000 - - -30000 - - - + + 40000 - - -50000 - - - + + 60000 - - -70000 - - - + + 80000 - - -90000 - - - + + 100000 - + 4 @@ 
-147,14 +117,14 @@ Input Size (bytes) 32768 - - - - - - - - + + + + + + + + diff --git a/benches/throughput_criterion.rs b/benches/throughput_criterion.rs index f999da6..7d355fa 100644 --- a/benches/throughput_criterion.rs +++ b/benches/throughput_criterion.rs @@ -44,8 +44,8 @@ fn benchmark_all(c: &mut Criterion) { group.plot_config(plot_config); // GxHash - let algo_name = if cfg!(feature = "avx2") { "gxhash-avx2" } else { "gxhash" }; - benchmark(&mut group, slice, algo_name, |data: &[u8], seed: i32| -> u64 { + let gxhash_name = if cfg!(hybrid) { "gxhash-hybrid" } else { "gxhash" }; + benchmark(&mut group, slice, gxhash_name, |data: &[u8], seed: i32| -> u64 { gxhash64(data, seed as i64) }); diff --git a/build.rs b/build.rs new file mode 100644 index 0000000..dd11580 --- /dev/null +++ b/build.rs @@ -0,0 +1,11 @@ +extern crate rustc_version; +use rustc_version::{version_meta, Channel}; + +fn main() { + if version_meta().unwrap().channel == Channel::Nightly + && cfg!(target_arch = "x86_64") + && cfg!(target_feature = "avx2") + && cfg!(target_feature = "vaes") { + println!("cargo:rustc-cfg=hybrid"); + } +} \ No newline at end of file diff --git a/src/gxhash/mod.rs b/src/gxhash/mod.rs index a3d7fd2..dd117ae 100644 --- a/src/gxhash/mod.rs +++ b/src/gxhash/mod.rs @@ -63,37 +63,36 @@ macro_rules! load_unaligned { }; } +pub(crate) use load_unaligned; + #[inline(always)] pub(crate) unsafe fn gxhash(input: &[u8], seed: State) -> State { - finalize(compress_fast(compress_all(input), seed)) + finalize(aes_encrypt(compress_all(input), seed)) } #[inline(always)] pub(crate) unsafe fn compress_all(input: &[u8]) -> State { let len = input.len(); + let mut ptr = input.as_ptr() as *const State; if len == 0 { return create_empty(); } - let mut ptr = input.as_ptr() as *const State; - if len <= VECTOR_SIZE { // Input fits on a single SIMD vector, however we might read beyond the input message // Thus we need this safe method that checks if it can safely read beyond or must copy return get_partial(ptr, len); } - let extra_bytes_count = len % VECTOR_SIZE; - let remaining_bytes: usize; + let mut hash_vector: State; + let end = ptr as usize + len; - // The input does not fit on a single SIMD vector - let hash_vector: State; + let extra_bytes_count = len % VECTOR_SIZE; if extra_bytes_count == 0 { load_unaligned!(ptr, v0); hash_vector = v0; - remaining_bytes = len - VECTOR_SIZE; } else { // If the input length does not match the length of a whole number of SIMD vectors, // it means we'll need to read a partial vector. 
We can start with the partial vector first, @@ -101,57 +100,53 @@ pub(crate) unsafe fn compress_all(input: &[u8]) -> State { // the input hash_vector = get_partial_unsafe(ptr, extra_bytes_count); ptr = ptr.cast::().add(extra_bytes_count).cast(); - remaining_bytes = len - extra_bytes_count; } - #[allow(unused_assignments)] - if len <= VECTOR_SIZE * 2 { - // Fast path when input length > 16 and <= 32 - load_unaligned!(ptr, v0); - compress(hash_vector, v0) - } else if len <= VECTOR_SIZE * 3 { + load_unaligned!(ptr, v0); + + if len > VECTOR_SIZE * 2 { // Fast path when input length > 32 and <= 48 - load_unaligned!(ptr, v0, v1); - compress(hash_vector, compress(v0, v1)) - } else { - // Input message is large and we can use the high ILP loop - compress_many(ptr, hash_vector, remaining_bytes) + load_unaligned!(ptr, v); + v0 = aes_encrypt(v0, v); + + if len > VECTOR_SIZE * 3 { + // Fast path when input length > 48 and <= 64 + load_unaligned!(ptr, v); + v0 = aes_encrypt(v0, v); + + if len > VECTOR_SIZE * 4 { + // Input message is large and we can use the high ILP loop + hash_vector = compress_many(ptr, end, hash_vector, len); + } + } } + + return aes_encrypt_last(hash_vector, + aes_encrypt(aes_encrypt(v0, ld(KEYS.as_ptr())), ld(KEYS.as_ptr().offset(4)))); } #[inline(always)] -unsafe fn compress_many(mut ptr: *const State, hash_vector: State, remaining_bytes: usize) -> State { +unsafe fn compress_many(mut ptr: *const State, end: usize, hash_vector: State, len: usize) -> State { const UNROLL_FACTOR: usize = 8; - let unrollable_blocks_count: usize = remaining_bytes / (VECTOR_SIZE * UNROLL_FACTOR) * UNROLL_FACTOR; - let end_address = ptr.add(unrollable_blocks_count) as usize; - let mut hash_vector = hash_vector; - while (ptr as usize) < end_address { + let remaining_bytes = end - ptr as usize; - load_unaligned!(ptr, v0, v1, v2, v3, v4, v5, v6, v7); - - let mut tmp: State; - tmp = compress_fast(v0, v1); - tmp = compress_fast(tmp, v2); - tmp = compress_fast(tmp, v3); - tmp = compress_fast(tmp, v4); - tmp = compress_fast(tmp, v5); - tmp = compress_fast(tmp, v6); - tmp = compress_fast(tmp, v7); - - hash_vector = compress(hash_vector, tmp); - } + let unrollable_blocks_count: usize = remaining_bytes / (VECTOR_SIZE * UNROLL_FACTOR) * UNROLL_FACTOR; let remaining_bytes = remaining_bytes - unrollable_blocks_count * VECTOR_SIZE; let end_address = ptr.add(remaining_bytes / VECTOR_SIZE) as usize; + // Process first individual blocks until we have an whole number of 8 blocks + let mut hash_vector = hash_vector; while (ptr as usize) < end_address { load_unaligned!(ptr, v0); - hash_vector = compress(hash_vector, v0); + hash_vector = aes_encrypt(hash_vector, v0); } - hash_vector + // Process the remaining n * 8 blocks + // This part may use 128-bit or 256-bit + compress_8(ptr, end, hash_vector, len) } #[cfg(test)] @@ -294,7 +289,7 @@ mod tests { fn is_stable() { assert_eq!(456576800, gxhash32(&[0u8; 0], 0)); assert_eq!(978957914, gxhash32(&[0u8; 1], 0)); - assert_eq!(3325885698, gxhash32(&[0u8; 1000], 0)); - assert_eq!(3805815999, gxhash32(&[42u8; 4242], 42)); + assert_eq!(2252110365, gxhash32(&[0u8; 1000], 0)); + assert_eq!(2426107958, gxhash32(&[42u8; 4242], 42)); } } diff --git a/src/gxhash/platform/arm_128.rs b/src/gxhash/platform/aarch64.rs similarity index 59% rename from src/gxhash/platform/arm_128.rs rename to src/gxhash/platform/aarch64.rs index 4cb452d..b314a61 100644 --- a/src/gxhash/platform/arm_128.rs +++ b/src/gxhash/platform/aarch64.rs @@ -4,15 +4,6 @@ use super::*; pub type State = int8x16_t; 
-#[repr(C)] -union ReinterpretUnion { - int64: int64x2_t, - int32: int32x4_t, - uint32: uint32x4_t, - int8: int8x16_t, - uint8: uint8x16_t, -} - #[inline(always)] pub unsafe fn create_empty() -> State { vdupq_n_s8(0) @@ -52,45 +43,33 @@ pub unsafe fn get_partial_safe(data: *const State, len: usize) -> State { pub unsafe fn get_partial_unsafe(data: *const State, len: usize) -> State { let indices = vld1q_s8([0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15].as_ptr()); let mask = vcgtq_s8(vdupq_n_s8(len as i8), indices); - let partial_vector = vandq_s8(load_unaligned(data), ReinterpretUnion { uint8: mask }.int8); + let partial_vector = vandq_s8(load_unaligned(data), vreinterpretq_s8_u8(mask)); vaddq_s8(partial_vector, vdupq_n_s8(len as i8)) } #[inline(always)] -pub unsafe fn compress(a: int8x16_t, b: int8x16_t) -> int8x16_t { - let keys_1 = vld1q_u32([0xFC3BC28E, 0x89C222E5, 0xB09D3E21, 0xF2784542].as_ptr()); - let keys_2 = vld1q_u32([0x03FCE279, 0xCB6B2E9B, 0xB361DC58, 0x39136BD9].as_ptr()); - - let mut bs = vreinterpretq_u8_s8(b); - bs = aes_encrypt(bs, vreinterpretq_u8_u32(keys_1)); - bs = aes_encrypt(bs, vreinterpretq_u8_u32(keys_2)); - - vreinterpretq_s8_u8(aes_encrypt_last(vreinterpretq_u8_s8(a), bs)) -} - -#[inline(always)] -pub unsafe fn compress_fast(a: int8x16_t, b: int8x16_t) -> int8x16_t { - vreinterpretq_s8_u8(aes_encrypt(vreinterpretq_u8_s8(a), vreinterpretq_u8_s8(b))) +pub unsafe fn ld(array: *const u32) -> State { + vreinterpretq_s8_u32(vld1q_u32(array)) } #[inline(always)] // See https://blog.michaelbrase.com/2018/05/08/emulating-x86-aes-intrinsics-on-armv8-a -unsafe fn aes_encrypt(data: uint8x16_t, keys: uint8x16_t) -> uint8x16_t { +pub unsafe fn aes_encrypt(data: State, keys: State) -> State { // Encrypt - let encrypted = vaeseq_u8(data, vdupq_n_u8(0)); + let encrypted = vaeseq_u8(vreinterpretq_u8_s8(data), vdupq_n_u8(0)); // Mix columns let mixed = vaesmcq_u8(encrypted); // Xor keys - veorq_u8(mixed, keys) + vreinterpretq_s8_u8(veorq_u8(mixed, vreinterpretq_u8_s8(keys))) } #[inline(always)] // See https://blog.michaelbrase.com/2018/05/08/emulating-x86-aes-intrinsics-on-armv8-a -unsafe fn aes_encrypt_last(data: uint8x16_t, keys: uint8x16_t) -> uint8x16_t { +pub unsafe fn aes_encrypt_last(data: State, keys: State) -> State { // Encrypt - let encrypted = vaeseq_u8(data, vdupq_n_u8(0)); + let encrypted = vaeseq_u8(vreinterpretq_u8_s8(data), vdupq_n_u8(0)); // Xor keys - veorq_u8(encrypted, keys) + vreinterpretq_s8_u8(veorq_u8(encrypted, vreinterpretq_u8_s8(keys))) } #[inline(always)] @@ -101,12 +80,52 @@ pub unsafe fn finalize(hash: State) -> State { let keys_3 = vld1q_u32([0xC78B122B, 0x5544B1B7, 0x689D2B7D, 0xD0012E32].as_ptr()); // 3 rounds of AES - let mut hash = ReinterpretUnion { int8: hash }.uint8; - hash = aes_encrypt(hash, ReinterpretUnion { uint32: keys_1 }.uint8); - hash = aes_encrypt(hash, ReinterpretUnion { uint32: keys_2 }.uint8); - hash = aes_encrypt_last(hash, ReinterpretUnion { uint32: keys_3 }.uint8); + let mut hash = hash; + hash = aes_encrypt(hash, vreinterpretq_s8_u32(keys_1)); + hash = aes_encrypt(hash, vreinterpretq_s8_u32(keys_2)); + hash = aes_encrypt_last(hash, vreinterpretq_s8_u32(keys_3)); + + hash +} + +#[inline(always)] +pub unsafe fn compress_8(mut ptr: *const State, end_address: usize, hash_vector: State, len: usize) -> State { + + // Disambiguation vectors + let mut t1: State = create_empty(); + let mut t2: State = create_empty(); + + // Hash is processed in two separate 128-bit parallel lanes + // This allows the same processing to be 
applied using 256-bit V-AES instrinsics + // so that hashes are stable in both cases. + let mut lane1 = hash_vector; + let mut lane2 = hash_vector; + + while (ptr as usize) < end_address { + + crate::gxhash::load_unaligned!(ptr, v0, v1, v2, v3, v4, v5, v6, v7); - ReinterpretUnion { uint8: hash }.int8 + let mut tmp1 = aes_encrypt(v0, v2); + let mut tmp2 = aes_encrypt(v1, v3); + + tmp1 = aes_encrypt(tmp1, v4); + tmp2 = aes_encrypt(tmp2, v5); + + tmp1 = aes_encrypt(tmp1, v6); + tmp2 = aes_encrypt(tmp2, v7); + + t1 = vaddq_s8(t1, ld(KEYS.as_ptr())); + t2 = vaddq_s8(t2, ld(KEYS.as_ptr().offset(4))); + + lane1 = aes_encrypt_last(aes_encrypt(tmp1, t1), lane1); + lane2 = aes_encrypt_last(aes_encrypt(tmp2, t2), lane2); + } + // For 'Zeroes' test + let len_vec = vreinterpretq_s8_u32(vdupq_n_u32(len as u32)); + lane1 = vaddq_s8(lane1, len_vec); + lane2 = vaddq_s8(lane2, len_vec); + // Merge lanes + aes_encrypt(lane1, lane2) } #[inline(always)] diff --git a/src/gxhash/platform/mod.rs b/src/gxhash/platform/mod.rs index adbfe87..97ecbab 100644 --- a/src/gxhash/platform/mod.rs +++ b/src/gxhash/platform/mod.rs @@ -1,19 +1,15 @@ #[cfg(target_arch = "aarch64")] -#[path = "arm_128.rs"] +#[path = "aarch64.rs"] mod platform; -#[cfg(all(feature = "avx2", target_arch = "x86_64", target_feature = "avx2"))] -#[path = "x86_256.rs"] +#[cfg(target_arch = "x86_64")] +#[path = "x86_64.rs"] mod platform; -#[cfg(all(not(feature = "avx2"), target_arch = "x86_64"))] -#[path = "x86_128.rs"] -mod platform; +pub use platform::*; use std::mem::size_of; -pub use platform::*; - pub(crate) const VECTOR_SIZE: usize = size_of::(); // 4KiB is the default page size for most systems, and conservative for other systems such as MacOS ARM (16KiB) const PAGE_SIZE: usize = 0x1000; @@ -26,3 +22,5 @@ unsafe fn check_same_page(ptr: *const State) -> bool { // Check if the 16nd byte from the current offset exceeds the page boundary offset_within_page < PAGE_SIZE - VECTOR_SIZE } + +pub const KEYS: [u32; 8] = [0xF2784542, 0xB09D3E21, 0x89C222E5, 0xFC3BC28E, 0x03FCE279, 0xCB6B2E9B, 0xB361DC58, 0x39132BD9]; \ No newline at end of file diff --git a/src/gxhash/platform/x86_128.rs b/src/gxhash/platform/x86_128.rs deleted file mode 100644 index 248d814..0000000 --- a/src/gxhash/platform/x86_128.rs +++ /dev/null @@ -1,135 +0,0 @@ -use core::arch::x86_64::*; - -use super::*; - -pub type State = __m128i; - -#[inline(always)] -pub unsafe fn create_empty() -> State { - _mm_setzero_si128() -} - -#[inline(always)] -pub unsafe fn create_seed(seed: i64) -> State { - _mm_set1_epi64x(seed) -} - -#[inline(always)] -pub unsafe fn load_unaligned(p: *const State) -> State { - _mm_loadu_si128(p) -} - -#[inline(always)] -pub unsafe fn get_partial(p: *const State, len: usize) -> State { - // Safety check - if check_same_page(p) { - get_partial_unsafe(p, len) - } else { - get_partial_safe(p, len) - } -} - -#[inline(always)] -pub unsafe fn get_partial_safe(data: *const State, len: usize) -> State { - // Temporary buffer filled with zeros - let mut buffer = [0i8; VECTOR_SIZE]; - // Copy data into the buffer - std::ptr::copy(data as *const i8, buffer.as_mut_ptr(), len); - // Load the buffer into a __m256i vector - let partial_vector = _mm_loadu_si128(buffer.as_ptr() as *const State); - _mm_add_epi8(partial_vector, _mm_set1_epi8(len as i8)) -} - -#[inline(always)] -pub unsafe fn get_partial_unsafe(data: *const State, len: usize) -> State { - let indices = _mm_set_epi8(15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); - let mask = _mm_cmpgt_epi8(_mm_set1_epi8(len as i8), 
indices); - let partial_vector = _mm_and_si128(_mm_loadu_si128(data), mask); - _mm_add_epi8(partial_vector, _mm_set1_epi8(len as i8)) -} - -#[inline(always)] -#[allow(overflowing_literals)] -pub unsafe fn compress(a: State, b: State) -> State { - let keys_1 = _mm_set_epi32(0xF2784542, 0xB09D3E21, 0x89C222E5, 0xFC3BC28E); - let keys_2 = _mm_set_epi32(0x39136BD9, 0xB361DC58, 0xCB6B2E9B, 0x03FCE279); - - // 2+1 rounds of AES for compression - let mut b = _mm_aesenc_si128(b, keys_1); - b = _mm_aesenc_si128(b, keys_2); - _mm_aesenclast_si128(a, b) -} - -#[inline(always)] -#[allow(overflowing_literals)] -pub unsafe fn compress_fast(a: State, b: State) -> State { - _mm_aesenc_si128(a, b) -} - -#[inline(always)] -#[allow(overflowing_literals)] -pub unsafe fn finalize(hash: State) -> State { - // Hardcoded AES keys - let keys_1 = _mm_set_epi32(0x85459F85, 0xAF163956, 0x8F2F35DB, 0x713B01D0); - let keys_2 = _mm_set_epi32(0xB89C054F, 0x3DD99ACA, 0x92CFA39C, 0x1DE09647); - let keys_3 = _mm_set_epi32(0xD0012E32, 0x689D2B7D, 0x5544B1B7, 0xC78B122B); - - // 4 rounds of AES - let mut hash = _mm_aesenc_si128(hash, keys_1); - hash = _mm_aesenc_si128(hash, keys_2); - hash = _mm_aesenclast_si128(hash, keys_3); - - hash -} - -#[inline(always)] -pub unsafe fn load_u8(x: u8) -> State { - _mm_set1_epi8(x as i8) -} - -#[inline(always)] -pub unsafe fn load_u16(x: u16) -> State { - _mm_set1_epi16(x as i16) -} - -#[inline(always)] -pub unsafe fn load_u32(x: u32) -> State { - _mm_set1_epi32(x as i32) -} - -#[inline(always)] -pub unsafe fn load_u64(x: u64) -> State { - _mm_set1_epi64x(x as i64) -} - -#[inline(always)] -pub unsafe fn load_u128(x: u128) -> State { - let ptr = &x as *const u128 as *const State; - _mm_loadu_si128(ptr) -} - -#[inline(always)] -pub unsafe fn load_i8(x: i8) -> State { - _mm_set1_epi8(x) -} - -#[inline(always)] -pub unsafe fn load_i16(x: i16) -> State { - _mm_set1_epi16(x) -} - -#[inline(always)] -pub unsafe fn load_i32(x: i32) -> State { - _mm_set1_epi32(x) -} - -#[inline(always)] -pub unsafe fn load_i64(x: i64) -> State { - _mm_set1_epi64x(x) -} - -#[inline(always)] -pub unsafe fn load_i128(x: i128) -> State { - let ptr = &x as *const i128 as *const State; - _mm_loadu_si128(ptr) -} \ No newline at end of file diff --git a/src/gxhash/platform/x86_256.rs b/src/gxhash/platform/x86_256.rs deleted file mode 100644 index 0b5b785..0000000 --- a/src/gxhash/platform/x86_256.rs +++ /dev/null @@ -1,138 +0,0 @@ -use core::arch::x86_64::*; - -use super::*; - -pub type State = __m256i; - -#[inline(always)] -pub unsafe fn create_empty() -> State { - _mm256_setzero_si256() -} - -#[inline(always)] -pub unsafe fn create_seed(seed: i64) -> State { - _mm256_set1_epi64x(seed) -} - -#[inline(always)] -pub unsafe fn load_unaligned(p: *const State) -> State { - _mm256_loadu_si256(p) -} - -#[inline(always)] -pub unsafe fn get_partial(p: *const State, len: usize) -> State { - // Safety check - if check_same_page(p) { - get_partial_unsafe(p, len as usize) - } else { - get_partial_safe(p, len as usize) - } -} - -#[inline(always)] -pub unsafe fn get_partial_safe(data: *const State, len: usize) -> State { - // Temporary buffer filled with zeros - let mut buffer = [0i8; VECTOR_SIZE]; - // Copy data into the buffer - std::ptr::copy(data as *const i8, buffer.as_mut_ptr(), len); - // Load the buffer into a __m256i vector - let partial_vector = _mm256_loadu_si256(buffer.as_ptr() as *const State); - _mm256_add_epi8(partial_vector, _mm256_set1_epi8(len as i8)) -} - -#[inline(always)] -pub unsafe fn get_partial_unsafe(data: 
*const State, len: usize) -> State { - let indices = _mm256_set_epi8(31, 30, 29, 28, 27, 26, 25, 24, 23, 22, 21, 20, 19, 18, 17, 16, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); - let mask = _mm256_cmpgt_epi8(_mm256_set1_epi8(len as i8), indices); - let partial_vector = _mm256_and_si256(_mm256_loadu_si256(data), mask); - _mm256_add_epi8(partial_vector, _mm256_set1_epi8(len as i8)) -} - -#[inline(always)] -#[allow(overflowing_literals)] -pub unsafe fn compress(a: State, b: State) -> State { - let keys_1 = _mm256_set_epi32(0xFC3BC28E, 0x89C222E5, 0xB09D3E21, 0xF2784542, 0x4155EE07, 0xC897CCE2, 0x780AF2C3, 0x8A72B781); - let keys_2 = _mm256_set_epi32(0x03FCE279, 0xCB6B2E9B, 0xB361DC58, 0x39136BD9, 0x7A83D76B, 0xB1E8F9F0, 0x028925A8, 0x3B9A4E71); - - // 2+1 rounds of AES for compression - let mut b = _mm256_aesenc_epi128(b, keys_1); - b = _mm256_aesenc_epi128(b, keys_2); - return _mm256_aesenclast_epi128(a, b); -} - -#[inline(always)] -#[allow(overflowing_literals)] -pub unsafe fn compress_fast(a: State, b: State) -> State { - return _mm256_aesenc_epi128(a, b); -} - -#[inline(always)] -#[allow(overflowing_literals)] -pub unsafe fn finalize(hash: State) -> State { - // Hardcoded AES keys - let keys_1 = _mm256_set_epi32(0x713B01D0, 0x8F2F35DB, 0xAF163956, 0x85459F85, 0xB49D3E21, 0xF2784542, 0x2155EE07, 0xC197CCE2); - let keys_2 = _mm256_set_epi32(0x1DE09647, 0x92CFA39C, 0x3DD99ACA, 0xB89C054F, 0xCB6B2E9B, 0xC361DC58, 0x39136BD9, 0x7A83D76F); - let keys_3 = _mm256_set_epi32(0xC78B122B, 0x5544B1B7, 0x689D2B7D, 0xD0012E32, 0xE2784542, 0x4155EE07, 0xC897CCE2, 0x780BF2C2); - - // 4 rounds of AES - let mut hash = _mm256_aesenc_epi128(hash, keys_1); - hash = _mm256_aesenc_epi128(hash, keys_2); - hash = _mm256_aesenclast_epi128(hash, keys_3); - - let permuted = _mm256_permute2x128_si256(hash, hash, 0x21); - _mm256_xor_si256(hash, permuted) -} - -#[inline(always)] -pub unsafe fn load_u8(x: u8) -> State { - _mm256_set1_epi8(x as i8) -} - -#[inline(always)] -pub unsafe fn load_u16(x: u16) -> State { - _mm256_set1_epi16(x as i16) -} - -#[inline(always)] -pub unsafe fn load_u32(x: u32) -> State { - _mm256_set1_epi32(x as i32) -} - -#[inline(always)] -pub unsafe fn load_u64(x: u64) -> State { - _mm256_set1_epi64x(x as i64) -} - -#[inline(always)] -pub unsafe fn load_u128(x: u128) -> State { - let ptr = &x as *const u128 as *const __m128i; - let s128 = _mm_loadu_si128(ptr); - _mm256_set_m128i(s128, s128) -} - -#[inline(always)] -pub unsafe fn load_i8(x: i8) -> State { - _mm256_set1_epi8(x) -} - -#[inline(always)] -pub unsafe fn load_i16(x: i16) -> State { - _mm256_set1_epi16(x) -} - -#[inline(always)] -pub unsafe fn load_i32(x: i32) -> State { - _mm256_set1_epi32(x) -} - -#[inline(always)] -pub unsafe fn load_i64(x: i64) -> State { - _mm256_set1_epi64x(x) -} - -#[inline(always)] -pub unsafe fn load_i128(x: i128) -> State { - let ptr = &x as *const i128 as *const __m128i; - let s128 = _mm_loadu_si128(ptr); - _mm256_set_m128i(s128, s128) -} \ No newline at end of file diff --git a/src/gxhash/platform/x86_64.rs b/src/gxhash/platform/x86_64.rs new file mode 100644 index 0000000..ce737b3 --- /dev/null +++ b/src/gxhash/platform/x86_64.rs @@ -0,0 +1,215 @@ +use core::arch::x86_64::*; + +use super::*; + +pub type State = __m128i; + +#[inline(always)] +pub unsafe fn create_empty() -> State { + _mm_setzero_si128() +} + +#[inline(always)] +pub unsafe fn create_seed(seed: i64) -> State { + _mm_set1_epi64x(seed) +} + +#[inline(always)] +pub unsafe fn load_unaligned(p: *const State) -> State { + _mm_loadu_si128(p) 
+} + +#[inline(always)] +pub unsafe fn get_partial(p: *const State, len: usize) -> State { + // Safety check + if check_same_page(p) { + get_partial_unsafe(p, len) + } else { + get_partial_safe(p, len) + } +} + +#[inline(always)] +pub unsafe fn get_partial_safe(data: *const State, len: usize) -> State { + // Temporary buffer filled with zeros + let mut buffer = [0i8; VECTOR_SIZE]; + // Copy data into the buffer + std::ptr::copy(data as *const i8, buffer.as_mut_ptr(), len); + // Load the buffer into a __m256i vector + let partial_vector = _mm_loadu_si128(buffer.as_ptr() as *const State); + _mm_add_epi8(partial_vector, _mm_set1_epi8(len as i8)) +} + +#[inline(always)] +pub unsafe fn get_partial_unsafe(data: *const State, len: usize) -> State { + let indices = _mm_set_epi8(15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1, 0); + let mask = _mm_cmpgt_epi8(_mm_set1_epi8(len as i8), indices); + let partial_vector = _mm_and_si128(_mm_loadu_si128(data), mask); + _mm_add_epi8(partial_vector, _mm_set1_epi8(len as i8)) +} + +#[inline(always)] +#[allow(dead_code)] +pub unsafe fn aes_encrypt(data: State, keys: State) -> State { + _mm_aesenc_si128(data, keys) +} + +#[inline(always)] +#[allow(dead_code)] +pub unsafe fn aes_encrypt_last(data: State, keys: State) -> State { + _mm_aesenclast_si128(data, keys) +} + +#[inline(always)] +#[allow(dead_code)] +pub unsafe fn ld(array: *const u32) -> State { + _mm_loadu_si128(array as *const State) +} + +#[inline(always)] +#[allow(overflowing_literals)] +pub unsafe fn finalize(hash: State) -> State { + // Hardcoded AES keys + let keys_1 = _mm_set_epi32(0x85459F85, 0xAF163956, 0x8F2F35DB, 0x713B01D0); + let keys_2 = _mm_set_epi32(0xB89C054F, 0x3DD99ACA, 0x92CFA39C, 0x1DE09647); + let keys_3 = _mm_set_epi32(0xD0012E32, 0x689D2B7D, 0x5544B1B7, 0xC78B122B); + + // 4 rounds of AES + let mut hash = _mm_aesenc_si128(hash, keys_1); + hash = _mm_aesenc_si128(hash, keys_2); + hash = _mm_aesenclast_si128(hash, keys_3); + + hash +} + +#[cfg(not(hybrid))] +#[inline(always)] +pub unsafe fn compress_8(mut ptr: *const State, end_address: usize, hash_vector: State, len: usize) -> State { + + // Disambiguation vectors + let mut t1: State = create_empty(); + let mut t2: State = create_empty(); + + // Hash is processed in two separate 128-bit parallel lanes + // This allows the same processing to be applied using 256-bit V-AES instrinsics + // so that hashes are stable in both cases. + let mut lane1 = hash_vector; + let mut lane2 = hash_vector; + + while (ptr as usize) < end_address { + + crate::gxhash::load_unaligned!(ptr, v0, v1, v2, v3, v4, v5, v6, v7); + + let mut tmp1 = aes_encrypt(v0, v2); + let mut tmp2 = aes_encrypt(v1, v3); + + tmp1 = aes_encrypt(tmp1, v4); + tmp2 = aes_encrypt(tmp2, v5); + + tmp1 = aes_encrypt(tmp1, v6); + tmp2 = aes_encrypt(tmp2, v7); + + t1 = _mm_add_epi8(t1, ld(KEYS.as_ptr())); + t2 = _mm_add_epi8(t2, ld(KEYS.as_ptr().offset(4))); + + lane1 = aes_encrypt_last(aes_encrypt(tmp1, t1), lane1); + lane2 = aes_encrypt_last(aes_encrypt(tmp2, t2), lane2); + } + // For 'Zeroes' test + let len_vec = _mm_set1_epi32(len as i32); + lane1 = _mm_add_epi8(lane1, len_vec); + lane2 = _mm_add_epi8(lane2, len_vec); + // Merge lanes + aes_encrypt(lane1, lane2) +} + +#[cfg(hybrid)] +#[inline(always)] +pub unsafe fn compress_8(ptr: *const State, end_address: usize, hash_vector: State, len: usize) -> State { + macro_rules! 
load_unaligned_x2 { + ($ptr:ident, $($var:ident),+) => { + $( + #[allow(unused_mut)] + let mut $var = _mm256_loadu_si256($ptr); + $ptr = ($ptr).offset(1); + )+ + }; + } + + let mut ptr = ptr as *const __m256i; + let mut t = _mm256_setzero_si256(); + let mut lane = _mm256_set_m128i(hash_vector, hash_vector); + while (ptr as usize) < end_address { + + load_unaligned_x2!(ptr, v0, v1, v2, v3); + + let mut tmp = _mm256_aesenc_epi128(v0, v1); + tmp = _mm256_aesenc_epi128(tmp, v2); + tmp = _mm256_aesenc_epi128(tmp, v3); + + t = _mm256_add_epi8(t, _mm256_loadu_si256(KEYS.as_ptr() as *const __m256i)); + + lane = _mm256_aesenclast_epi128(_mm256_aesenc_epi128(tmp, t), lane); + } + // Extract the two 128-bit lanes + let mut lane1 = _mm256_castsi256_si128(lane); + let mut lane2 = _mm256_extracti128_si256(lane, 1); + // For 'Zeroes' test + let len_vec = _mm_set1_epi32(len as i32); + lane1 = _mm_add_epi8(lane1, len_vec); + lane2 = _mm_add_epi8(lane2, len_vec); + // Merge lanes + aes_encrypt(lane1, lane2) +} + +#[inline(always)] +pub unsafe fn load_u8(x: u8) -> State { + _mm_set1_epi8(x as i8) +} + +#[inline(always)] +pub unsafe fn load_u16(x: u16) -> State { + _mm_set1_epi16(x as i16) +} + +#[inline(always)] +pub unsafe fn load_u32(x: u32) -> State { + _mm_set1_epi32(x as i32) +} + +#[inline(always)] +pub unsafe fn load_u64(x: u64) -> State { + _mm_set1_epi64x(x as i64) +} + +#[inline(always)] +pub unsafe fn load_u128(x: u128) -> State { + let ptr = &x as *const u128 as *const State; + _mm_loadu_si128(ptr) +} + +#[inline(always)] +pub unsafe fn load_i8(x: i8) -> State { + _mm_set1_epi8(x) +} + +#[inline(always)] +pub unsafe fn load_i16(x: i16) -> State { + _mm_set1_epi16(x) +} + +#[inline(always)] +pub unsafe fn load_i32(x: i32) -> State { + _mm_set1_epi32(x) +} + +#[inline(always)] +pub unsafe fn load_i64(x: i64) -> State { + _mm_set1_epi64x(x) +} + +#[inline(always)] +pub unsafe fn load_i128(x: i128) -> State { + let ptr = &x as *const i128 as *const State; + _mm_loadu_si128(ptr) +} \ No newline at end of file diff --git a/src/hasher.rs b/src/hasher.rs index 5b82406..2cbc6c7 100644 --- a/src/hasher.rs +++ b/src/hasher.rs @@ -98,7 +98,7 @@ macro_rules! write { #[inline] fn $name(&mut self, value: $type) { self.state = unsafe { - compress_fast($load(value), self.state) + aes_encrypt($load(value), self.state) }; } } @@ -115,7 +115,8 @@ impl Hasher for GxHasher { #[inline] fn write(&mut self, bytes: &[u8]) { - self.state = unsafe { compress_fast(compress_all(bytes), self.state) }; + // Improvement: only compress at this stage and finalize in finish + self.state = unsafe { aes_encrypt(compress_all(bytes), self.state) }; } write!(write_u8, u8, load_u8); @@ -181,14 +182,6 @@ mod tests { assert!(hashset.insert("bye")); } - #[test] - fn hasher_handles_empty_inputs() { - let mut hashset = GxHashSet::default(); - // Getting a ptr from a Vec::::new() return a pointer with address of 1 - // We must make sure we dont SIGSEGV in such case - assert!(hashset.insert(Vec::::new())); - } - // This is important for DOS resistance #[test] fn gxhashset_uses_default_gxhasherbuilder() { diff --git a/src/lib.rs b/src/lib.rs index 7fd9229..0c54243 100644 --- a/src/lib.rs +++ b/src/lib.rs @@ -1,5 +1,5 @@ -// Feature 'avx2' currently requires unstable 'stdsimd' -#![cfg_attr(all(feature = "avx2", target_arch = "x86_64"), feature(stdsimd))] +// Hybrid SIMD width usage currently requires unstable 'stdsimd' +#![cfg_attr(hybrid, feature(stdsimd))] #[rustfmt::skip] mod gxhash;
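
Note on verifying the new code paths: build.rs emits `cargo:rustc-cfg=hybrid` only on nightly x86_64 with the `avx2` and `vaes` target features enabled, and the 128-bit and hybrid 256-bit paths are intended to produce identical hashes (hence the two-lane `compress_8`). The sketch below is a standalone check against the reference values from the updated `is_stable` test; it assumes the public `gxhash32` API, and the `RUSTFLAGS` invocation in the comment is only an assumption about how the required target features could be enabled locally, not something this patch configures.

// Standalone sketch (assumed usage of the public `gxhash32` API; not part of this patch).
// To exercise the hybrid path, something like the following is assumed to work on nightly x86_64:
//   RUSTFLAGS="-C target-feature=+avx2,+vaes" cargo +nightly run --release
use gxhash::gxhash32;

fn main() {
    // Reference values taken from the updated `is_stable` test in src/gxhash/mod.rs.
    assert_eq!(456576800, gxhash32(&[0u8; 0], 0));
    assert_eq!(978957914, gxhash32(&[0u8; 1], 0));
    assert_eq!(2252110365, gxhash32(&[0u8; 1000], 0));
    assert_eq!(2426107958, gxhash32(&[42u8; 4242], 42));
    println!("hash values match the reference vectors on this build configuration");
}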