
Uniform keys option for stress test. #185

Merged 4 commits on Feb 9, 2023
1 change: 1 addition & 0 deletions admin/Cargo.toml
@@ -12,6 +12,7 @@ fdlimit = "0.2.1"
log = "0.4.8"
parity-db = { path = ".." }
rand = { version = "0.8.5", features = ["small_rng"] }
blake2 = "0.10.4"

[target.'cfg(not(target_env = "msvc"))'.dependencies]
jemallocator = "0.5.0"
62 changes: 58 additions & 4 deletions admin/src/bench/mod.rs
@@ -76,6 +76,10 @@ pub struct Stress {
/// Use btree index.
#[clap(long)]
pub ordered: bool,

/// Use uniform keys.
#[clap(long)]
pub uniform: bool,
}

#[derive(Clone)]
@@ -90,6 +94,7 @@ pub struct Args {
pub no_check: bool,
pub compress: bool,
pub ordered: bool,
pub uniform: bool,
}

impl Stress {
@@ -105,24 +110,37 @@ impl Stress {
no_check: self.no_check,
compress: self.compress,
ordered: self.ordered,
uniform: self.uniform,
}
}
}

struct SizePool {
distribution: std::collections::BTreeMap<u32, u32>,
total: u32,
uniform: bool,
cache_start: u64,
cached_keys: Vec<Key>,
}

impl SizePool {
fn from_histogram(h: &[(u32, u32)]) -> SizePool {
fn from_histogram(h: &[(u32, u32)], uniform: bool) -> SizePool {
let mut distribution = std::collections::BTreeMap::default();
let mut total = 0;
for (size, count) in h {
total += count;
distribution.insert(total, *size);
}
SizePool { distribution, total }
SizePool { distribution, total, uniform, cache_start: 0, cached_keys: Vec::new() }
}

fn cache_keys(&mut self, start: u64, num_keys: u64) {
self.cache_start = start;
self.cached_keys.clear();
for index in self.cache_start..self.cache_start + num_keys {
let key_to_cache = self.key(index);
self.cached_keys.push(key_to_cache);
}
}

fn value(&self, seed: u64, compressable: bool) -> Vec<u8> {
@@ -140,9 +158,34 @@ impl SizePool {
}

fn key(&self, seed: u64) -> Key {
use blake2::{
digest::{typenum::U32, FixedOutput, Update},
Blake2bMac,
};

if seed >= self.cache_start {
let key_index = seed - self.cache_start;
if key_index < self.cached_keys.len() as u64 {
return self.cached_keys[key_index as usize]
}
}

let mut rng = rand::rngs::SmallRng::seed_from_u64(seed);
let mut key = Key::default();
rng.fill_bytes(&mut key);

if self.uniform {
// Just using this to generate uniform keys. Actual salting will still happen inside the
// database, even for uniform keys.
let salt = [0; 32];

let mut ctx = Blake2bMac::<U32>::new_with_salt_and_personal(&salt, &[], &[])
.expect("Salt length (32) is a valid key length (<= 64)");
ctx.update(key.as_ref());
let hash = ctx.finalize_fixed();
key.copy_from_slice(&hash);
}

key
}
}
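The cache-then-fallback lookup in `SizePool::key` above can be sketched standalone. This is a simplified illustration, not the PR's code: it swaps `SmallRng` and `Blake2bMac` for the standard library's `DefaultHasher` (so it runs without external crates) and uses `u64` keys, but the structure is the same — check whether the seed falls in the pre-generated window, otherwise recompute the key deterministically from the seed:

```rust
use std::collections::hash_map::DefaultHasher;
use std::hash::{Hash, Hasher};

// Stand-in for the PR's SmallRng + Blake2b pipeline: any deterministic
// seed -> key function is enough to demonstrate the caching structure.
fn make_key(seed: u64) -> u64 {
    let mut h = DefaultHasher::new();
    seed.hash(&mut h);
    h.finish()
}

struct KeyPool {
    cache_start: u64,
    cached_keys: Vec<u64>,
}

impl KeyPool {
    fn cache_keys(&mut self, start: u64, num_keys: u64) {
        self.cache_start = start;
        self.cached_keys = (start..start + num_keys).map(make_key).collect();
    }

    fn key(&self, seed: u64) -> u64 {
        // Fast path: the seed falls inside the pre-generated window.
        if seed >= self.cache_start {
            let idx = seed - self.cache_start;
            if idx < self.cached_keys.len() as u64 {
                return self.cached_keys[idx as usize];
            }
        }
        // Slow path: recompute deterministically. Per the review thread,
        // readers and pruning writers can land here.
        make_key(seed)
    }
}

fn main() {
    let mut pool = KeyPool { cache_start: 0, cached_keys: Vec::new() };
    pool.cache_keys(100, 10);
    // Cached and recomputed keys agree, so both paths are interchangeable.
    assert_eq!(pool.key(105), make_key(105));
    assert_eq!(pool.key(50), make_key(50)); // outside the window: slow path
    println!("ok");
}
```

Because generation is deterministic in the seed, the cache is purely an optimization: a miss returns exactly the same key, just slower.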
@@ -238,9 +281,7 @@ fn iter(db: Arc<Db>, shutdown: Arc<AtomicBool>) {
pub fn run_internal(args: Args, db: Db) {
let args = Arc::new(args);
let shutdown = Arc::new(AtomicBool::new(false));
let pool = Arc::new(SizePool::from_histogram(sizes::KUSAMA_STATE_DISTRIBUTION));
let db = Arc::new(db);
let start = std::time::Instant::now();

let mut threads = Vec::new();

@@ -252,6 +293,19 @@ pub fn run_internal(args: Args, db: Db) {
0
};

let mut pool = SizePool::from_histogram(sizes::KUSAMA_STATE_DISTRIBUTION, args.uniform);
if args.uniform {
println!("Generating uniform keys.");
Collaborator:

> I am not too sure when we hit non-cached keys, but it is good to have the code for it.

Contributor Author:

> Yeah. Reader threads will hit them when appending. Writer threads can also hit them sometimes when pruning and appending. Might have missed something else.

let offset = args.seed.unwrap_or(0);
let start_index = start_commit as u64 * COMMIT_SIZE as u64 + offset;
let num_keys = args.commits as u64 * COMMIT_SIZE as u64;
pool.cache_keys(start_index, num_keys);
}
let pool = Arc::new(pool);

let start = std::time::Instant::now();

COMMITS.store(start_commit, Ordering::SeqCst);
NEXT_COMMIT.store(start_commit, Ordering::SeqCst);

6 changes: 6 additions & 0 deletions admin/src/lib.rs
@@ -120,6 +120,12 @@ pub fn run() -> Result<(), String> {
c.compression = parity_db::CompressionType::Lz4;
}
}
if args.uniform {
for mut c in &mut db_options.columns {
c.uniform = true;
}
}

let db = parity_db::Db::open_or_create(&db_options).unwrap();
bench::run_internal(args, db);
},