@@ -4,10 +4,16 @@ extern crate criterion;
 use criterion::{black_box, BatchSize, Criterion};
 use rand::prelude::*;
 use rand_distr::{Distribution, Normal};
-use sieve_cache::{ShardedSieveCache, SieveCache, SyncSieveCache};
+use sieve_cache::SieveCache;
 use std::sync::Arc;
 use std::thread;
 
+#[cfg(feature = "sync")]
+use sieve_cache::SyncSieveCache;
+
+#[cfg(feature = "sharded")]
+use sieve_cache::ShardedSieveCache;
+
 /// Benchmark sequential access patterns with the base SieveCache implementation.
 ///
 /// This benchmark measures the performance of sequential insert and get operations
@@ -108,146 +114,162 @@ fn bench_composite_normal(c: &mut Criterion) {
     });
 }
 
-/// Benchmark comparing different thread-safe cache implementations in a high-concurrency scenario.
-///
-/// This benchmark measures the performance difference between:
-/// 1. SyncSieveCache - using a single mutex for the entire cache
-/// 2. ShardedSieveCache - using multiple mutexes (default 16 shards)
-/// 3. ShardedSieveCache with 32 shards - higher shard count
-///
-/// The test simulates multiple threads performing random operations (inserts and lookups)
-/// concurrently, which should highlight the benefits of the sharded approach in
-/// reducing lock contention.
-fn bench_concurrent_access(c: &mut Criterion) {
-    let mut group = c.benchmark_group("concurrent_access");
-    group.sample_size(10); // Reduce sample size for these expensive benchmarks
-
-    // Set up benchmark parameters
-    const CACHE_SIZE: usize = 10000;
-    const NUM_THREADS: usize = 8;
-    const OPS_PER_THREAD: usize = 1000;
-
-    // Generic benchmark function to reduce code duplication
-    let run_concurrent_benchmark = |cache: Arc<dyn CacheInterface<u64, u64>>| {
-        let mut handles = Vec::with_capacity(NUM_THREADS);
-
-        for thread_id in 0..NUM_THREADS {
-            let cache_clone = Arc::clone(&cache);
-            let handle = thread::spawn(move || {
-                // Use a seeded RNG for reproducibility, with different seeds per thread
-                let mut rng = StdRng::seed_from_u64(thread_id as u64);
-
-                for i in 0..OPS_PER_THREAD {
-                    // Use a key range that creates some contention but also some distribution
-                    let key = rng.random_range(0..1000);
-
-                    // Mix operations: 40% inserts, 60% reads
-                    if i % 10 < 4 {
-                        black_box(cache_clone.insert(key, key));
-                    } else {
-                        black_box(cache_clone.get(&key));
-                    }
-                }
-            });
-            handles.push(handle);
-        }
+// Interface trait to allow treating both cache implementations uniformly
+trait CacheInterface<K, V>: Send + Sync {
+    fn insert(&self, key: K, value: V) -> bool;
+    fn get(&self, key: &K) -> Option<V>;
+}
 
-        for handle in handles {
-            handle.join().unwrap();
-        }
-    };
+// Only compile concurrent benchmark when both thread-safe implementations are available
+#[cfg(all(feature = "sync", feature = "sharded"))]
+mod concurrent_benchmarks {
+    use super::*;
 
-    // Benchmark with SyncSieveCache (single mutex)
-    group.bench_function("sync_cache", |b| {
-        b.iter_batched(
-            || {
-                // Setup for each iteration
-                Arc::new(SyncSieveCacheAdapter(
-                    SyncSieveCache::new(CACHE_SIZE).unwrap(),
-                ))
-            },
-            |cache| run_concurrent_benchmark(cache),
-            BatchSize::SmallInput,
-        );
-    });
+    /// Benchmark comparing different thread-safe cache implementations in a high-concurrency scenario.
+    ///
+    /// This benchmark measures the performance difference between:
+    /// 1. SyncSieveCache - using a single mutex for the entire cache
+    /// 2. ShardedSieveCache - using multiple mutexes (default 16 shards)
+    /// 3. ShardedSieveCache with 32 shards - higher shard count
+    ///
+    /// The test simulates multiple threads performing random operations (inserts and lookups)
+    /// concurrently, which should highlight the benefits of the sharded approach in
+    /// reducing lock contention.
+    pub fn bench_concurrent_access(c: &mut Criterion) {
+        let mut group = c.benchmark_group("concurrent_access");
+        group.sample_size(10); // Reduce sample size for these expensive benchmarks
 
-    // Benchmark with ShardedSieveCache (default: 16 mutexes)
-    group.bench_function("sharded_cache_16_shards", |b| {
-        b.iter_batched(
-            || {
-                // Setup for each iteration
-                Arc::new(ShardedSieveCacheAdapter(
-                    ShardedSieveCache::new(CACHE_SIZE).unwrap(),
-                ))
-            },
-            |cache| run_concurrent_benchmark(cache),
-            BatchSize::SmallInput,
-        );
-    });
+        // Set up benchmark parameters
+        const CACHE_SIZE: usize = 10000;
+        const NUM_THREADS: usize = 8;
+        const OPS_PER_THREAD: usize = 1000;
 
-    // Benchmark with different shard counts
-    group.bench_function("sharded_cache_32_shards", |b| {
-        b.iter_batched(
-            || {
-                // Setup for each iteration
-                Arc::new(ShardedSieveCacheAdapter(
-                    ShardedSieveCache::with_shards(CACHE_SIZE, 32).unwrap(),
-                ))
-            },
-            |cache| run_concurrent_benchmark(cache),
-            BatchSize::SmallInput,
-        );
-    });
+        // Generic benchmark function to reduce code duplication
+        let run_concurrent_benchmark = |cache: Arc<dyn CacheInterface<u64, u64>>| {
+            let mut handles = Vec::with_capacity(NUM_THREADS);
 
-    group.finish();
-}
+            for thread_id in 0..NUM_THREADS {
+                let cache_clone = Arc::clone(&cache);
+                let handle = thread::spawn(move || {
+                    // Use a seeded RNG for reproducibility, with different seeds per thread
+                    let mut rng = StdRng::seed_from_u64(thread_id as u64);
 
-// Interface trait to allow treating both cache implementations uniformly
-trait CacheInterface<K, V>: Send + Sync {
-    fn insert(&self, key: K, value: V) -> bool;
-    fn get(&self, key: &K) -> Option<V>;
-}
+                    for i in 0..OPS_PER_THREAD {
+                        // Use a key range that creates some contention but also some distribution
+                        let key = rng.random_range(0..1000);
 
-// Adapter for SyncSieveCache
-struct SyncSieveCacheAdapter<K: Eq + std::hash::Hash + Clone + Send + Sync, V: Clone + Send + Sync>(
-    SyncSieveCache<K, V>,
-);
+                        // Mix operations: 40% inserts, 60% reads
+                        if i % 10 < 4 {
+                            black_box(cache_clone.insert(key, key));
+                        } else {
+                            black_box(cache_clone.get(&key));
+                        }
+                    }
+                });
+                handles.push(handle);
+            }
 
-impl<K: Eq + std::hash::Hash + Clone + Send + Sync, V: Clone + Send + Sync> CacheInterface<K, V>
-    for SyncSieveCacheAdapter<K, V>
-{
-    fn insert(&self, key: K, value: V) -> bool {
-        self.0.insert(key, value)
-    }
+            for handle in handles {
+                handle.join().unwrap();
+            }
+        };
+
+        // Benchmark with SyncSieveCache (single mutex)
+        group.bench_function("sync_cache", |b| {
+            b.iter_batched(
+                || {
+                    // Setup for each iteration
+                    Arc::new(SyncSieveCacheAdapter(
+                        SyncSieveCache::new(CACHE_SIZE).unwrap(),
+                    ))
+                },
+                |cache| run_concurrent_benchmark(cache),
+                BatchSize::SmallInput,
+            );
+        });
+
+        // Benchmark with ShardedSieveCache (default: 16 mutexes)
+        group.bench_function("sharded_cache_16_shards", |b| {
+            b.iter_batched(
+                || {
+                    // Setup for each iteration
+                    Arc::new(ShardedSieveCacheAdapter(
+                        ShardedSieveCache::new(CACHE_SIZE).unwrap(),
+                    ))
+                },
+                |cache| run_concurrent_benchmark(cache),
+                BatchSize::SmallInput,
+            );
+        });
 
-    fn get(&self, key: &K) -> Option<V> {
-        self.0.get(key)
+        // Benchmark with different shard counts
+        group.bench_function("sharded_cache_32_shards", |b| {
+            b.iter_batched(
+                || {
+                    // Setup for each iteration
+                    Arc::new(ShardedSieveCacheAdapter(
+                        ShardedSieveCache::with_shards(CACHE_SIZE, 32).unwrap(),
+                    ))
+                },
+                |cache| run_concurrent_benchmark(cache),
+                BatchSize::SmallInput,
+            );
+        });
+
+        group.finish();
     }
-}
 
-// Adapter for ShardedSieveCache
-struct ShardedSieveCacheAdapter<
-    K: Eq + std::hash::Hash + Clone + Send + Sync,
-    V: Clone + Send + Sync,
->(ShardedSieveCache<K, V>);
-
-impl<K: Eq + std::hash::Hash + Clone + Send + Sync, V: Clone + Send + Sync> CacheInterface<K, V>
-    for ShardedSieveCacheAdapter<K, V>
-{
-    fn insert(&self, key: K, value: V) -> bool {
-        self.0.insert(key, value)
+    // Adapter for SyncSieveCache
+    struct SyncSieveCacheAdapter<K: Eq + std::hash::Hash + Clone + Send + Sync, V: Clone + Send + Sync>(
+        SyncSieveCache<K, V>,
+    );
+
+    impl<K: Eq + std::hash::Hash + Clone + Send + Sync, V: Clone + Send + Sync> CacheInterface<K, V>
+        for SyncSieveCacheAdapter<K, V>
+    {
+        fn insert(&self, key: K, value: V) -> bool {
+            self.0.insert(key, value)
+        }
+
+        fn get(&self, key: &K) -> Option<V> {
+            self.0.get(key)
+        }
     }
 
-    fn get(&self, key: &K) -> Option<V> {
-        self.0.get(key)
+    // Adapter for ShardedSieveCache
+    struct ShardedSieveCacheAdapter<
+        K: Eq + std::hash::Hash + Clone + Send + Sync,
+        V: Clone + Send + Sync,
+    >(ShardedSieveCache<K, V>);
+
+    impl<K: Eq + std::hash::Hash + Clone + Send + Sync, V: Clone + Send + Sync> CacheInterface<K, V>
+        for ShardedSieveCacheAdapter<K, V>
+    {
+        fn insert(&self, key: K, value: V) -> bool {
+            self.0.insert(key, value)
+        }
+
+        fn get(&self, key: &K) -> Option<V> {
+            self.0.get(key)
+        }
     }
 }
 
+#[cfg(all(feature = "sync", feature = "sharded"))]
 criterion_group!(
     benches,
     bench_sequence,
     bench_composite,
     bench_composite_normal,
-    bench_concurrent_access
+    concurrent_benchmarks::bench_concurrent_access
 );
+
+#[cfg(not(all(feature = "sync", feature = "sharded")))]
+criterion_group!(
+    benches,
+    bench_sequence,
+    bench_composite,
+    bench_composite_normal
+);
+
 criterion_main!(benches);
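
For reference, a minimal sketch (not part of this patch) of how downstream code could pick a thread-safe cache behind the same Cargo features the benchmarks are gated on. The helper name make_cache is hypothetical; only the constructors already shown in the diff (SyncSieveCache::new, ShardedSieveCache::new, both unwrapped as above) are assumed.

    // Hypothetical helper, assuming the "sync" and "sharded" features from this patch.
    #[cfg(feature = "sharded")]
    fn make_cache(capacity: usize) -> sieve_cache::ShardedSieveCache<u64, u64> {
        // Constructor is assumed to return a Result, matching the .unwrap() calls above.
        sieve_cache::ShardedSieveCache::new(capacity).unwrap()
    }

    #[cfg(all(feature = "sync", not(feature = "sharded")))]
    fn make_cache(capacity: usize) -> sieve_cache::SyncSieveCache<u64, u64> {
        sieve_cache::SyncSieveCache::new(capacity).unwrap()
    }

With this layout, the concurrent comparison only builds when both features are enabled (for example, cargo bench --features sync,sharded); otherwise the second criterion_group! registers just the single-threaded benchmarks.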