Fix default data cache limit validation during eviction (#1779)

renanmagagnin · web-flow · commit 90bb0b4d4f89 · 2026-03-09T16:47:27.000Z
Fixes the `is_limit_exceeded()` function used by the data cache when in default mode (which should keep 5% of the space in the cache file system available). Before the fix, it incorrectly counted space reserved by the file system as available space, which could lead to 100% space usage. Now, reserved space is taken into account and the 5% available space is respected. A regression test was also added. ### Does this change impact existing behavior? No ### Does this change need a changelog entry? Does it require a version change? Yes --- By submitting this pull request, I confirm that my contribution is made under the terms of the Apache 2.0 license and I agree to the terms of the [Developer Certificate of Origin (DCO)](https://developercertificate.org/). --------- Signed-off-by: Renan Magagnin <renanmag@amazon.co.uk>
diff --git a/mountpoint-s3-fs/CHANGELOG.md b/mountpoint-s3-fs/CHANGELOG.md
@@ -1,6 +1,7 @@
 ## Unreleased (v0.9.1)
 
 * Upgrade cargo dependencies.
+* Fix incorrect validation of the default data cache limit, which could cause Mountpoint to preserve less than 5% of the cache file system's space as available space ([#1779](https://github.com/awslabs/mountpoint-s3/pull/1779))
 
 ## v0.9.0 (January 22, 2026)
 
diff --git a/mountpoint-s3-fs/src/data_cache.rs b/mountpoint-s3-fs/src/data_cache.rs
@@ -15,7 +15,9 @@ use thiserror::Error;
 
 pub use crate::checksums::ChecksummedBytes;
 pub use crate::data_cache::cache_directory::ManagedCacheDir;
-pub use crate::data_cache::disk_data_cache::{CacheLimit, DiskDataCache, DiskDataCacheConfig};
+pub use crate::data_cache::disk_data_cache::{
+    CacheLimit, DEFAULT_CACHE_MIN_AVAILABLE_RATIO, DiskDataCache, DiskDataCacheConfig,
+};
 pub use crate::data_cache::express_data_cache::{ExpressDataCache, ExpressDataCacheConfig, build_prefix, get_s3_key};
 pub use crate::data_cache::in_memory_data_cache::InMemoryDataCache;
 pub use crate::data_cache::multilevel_cache::MultilevelDataCache;
diff --git a/mountpoint-s3-fs/src/data_cache/disk_data_cache.rs b/mountpoint-s3-fs/src/data_cache/disk_data_cache.rs
@@ -62,9 +62,15 @@ pub enum CacheLimit {
     AvailableSpace { min_ratio: f64 },
 }
 
+/// Default minimum ratio of available space to preserve when using the
+/// [`CacheLimit::AvailableSpace`] cache limit.
+///
+/// The value `0.05` preserves 5% of the filesystem's total space as available space.
+/// It is the `min_ratio` produced by `CacheLimit::default()`.
+pub const DEFAULT_CACHE_MIN_AVAILABLE_RATIO: f64 = 0.05;
+
 impl Default for CacheLimit {
     fn default() -> Self {
-        CacheLimit::AvailableSpace { min_ratio: 0.05 } // Preserve 5% available space
+        CacheLimit::AvailableSpace {
+            min_ratio: DEFAULT_CACHE_MIN_AVAILABLE_RATIO,
+        }
     }
 }
 
@@ -407,7 +413,7 @@ impl DiskDataCache {
                         return false;
                     }
                 };
-                (stats.blocks_free() as f64) < min_ratio * (stats.blocks() as f64)
+                (stats.blocks_available() as f64) < min_ratio * (stats.blocks() as f64)
             }
         }
     }
diff --git a/mountpoint-s3-fs/tests/fuse_tests/cache_test.rs b/mountpoint-s3-fs/tests/fuse_tests/cache_test.rs
@@ -1,34 +1,46 @@
 use crate::common::cache::CacheTestWrapper;
-use crate::common::fuse::create_fuse_session;
-use crate::common::fuse::s3_session::create_crt_client;
-use crate::common::s3::{get_test_prefix, get_test_s3_path};
-
-use mountpoint_s3_client::S3CrtClient;
-use mountpoint_s3_fs::Runtime;
-use mountpoint_s3_fs::data_cache::{DataCache, DiskDataCache, DiskDataCacheConfig};
-use mountpoint_s3_fs::fuse::session::FuseSession;
-use mountpoint_s3_fs::memory::PagedPool;
-use mountpoint_s3_fs::object::ObjectId;
-use mountpoint_s3_fs::prefetch::Prefetcher;
-use mountpoint_s3_fs::s3::S3Path;
-
+use crate::common::fuse::{self, TestSessionConfig};
+use mountpoint_s3_fs::data_cache::{CacheLimit, DEFAULT_CACHE_MIN_AVAILABLE_RATIO, DiskDataCache, DiskDataCacheConfig};
 use rand::rngs::SmallRng;
-use rand::{Rng, RngExt, SeedableRng};
-use std::fs;
-use std::time::Duration;
-use tempfile::TempDir;
-use test_case::test_case;
+use rand::{Rng, SeedableRng};
+use std::fs::{self, File};
+use std::io::Read;
+use std::path::{Path, PathBuf};
+use std::process::Command;
+use tracing::{debug, info, warn};
+
+#[cfg(feature = "s3_tests")]
+use {
+    crate::common::fuse::create_fuse_session,
+    crate::common::fuse::s3_session::create_crt_client,
+    crate::common::s3::{get_test_prefix, get_test_s3_path},
+    mountpoint_s3_client::S3CrtClient,
+    mountpoint_s3_fs::Runtime,
+    mountpoint_s3_fs::data_cache::DataCache,
+    mountpoint_s3_fs::fuse::session::FuseSession,
+    mountpoint_s3_fs::memory::PagedPool,
+    mountpoint_s3_fs::object::ObjectId,
+    mountpoint_s3_fs::prefetch::Prefetcher,
+    mountpoint_s3_fs::s3::S3Path,
+    rand::RngExt,
+    std::time::Duration,
+    tempfile::TempDir,
+    test_case::test_case,
+};
+
+#[cfg(feature = "s3express_tests")]
+use {
+    crate::common::s3::{get_express_bucket, get_express_sse_kms_bucket, get_standard_bucket, get_test_kms_key_id},
+    mountpoint_s3_client::ObjectClient,
+    mountpoint_s3_fs::data_cache::{BlockIndex, ExpressDataCache, ExpressDataCacheConfig, build_prefix, get_s3_key},
+};
 
 #[cfg(all(feature = "s3express_tests", feature = "second_account_tests"))]
 use crate::common::s3::{get_bucket_owner, get_external_express_bucket, get_test_endpoint_config};
-#[cfg(feature = "s3express_tests")]
-use crate::common::s3::{get_express_bucket, get_express_sse_kms_bucket, get_standard_bucket, get_test_kms_key_id};
-#[cfg(feature = "s3express_tests")]
-use mountpoint_s3_client::ObjectClient;
-#[cfg(feature = "s3express_tests")]
-use mountpoint_s3_fs::data_cache::{BlockIndex, ExpressDataCache, ExpressDataCacheConfig, build_prefix, get_s3_key};
 
+#[cfg(feature = "s3_tests")]
 const CACHE_BLOCK_SIZE: u64 = 1024 * 1024;
+#[cfg(feature = "s3_tests")]
 const CLIENT_PART_SIZE: usize = 8 * 1024 * 1024;
 
 /// A test that checks that an invalid block may not be served from the cache
@@ -124,6 +136,7 @@ fn express_cache_write_read(key_suffix: &str, key_size: usize, object_size: usiz
 #[test_case("£", 100, 1024; "non-ascii key")]
 #[test_case("key", 1024, 1024; "long key")]
 #[test_case("key", 100, 1024 * 1024; "big file")]
+#[cfg(feature = "s3_tests")]
 fn disk_cache_write_read(key_suffix: &str, key_size: usize, object_size: usize) {
     let cache_dir = tempfile::tempdir().unwrap();
     let cache_config = DiskDataCacheConfig {
@@ -177,6 +190,7 @@ async fn express_cache_read_empty() {
 }
 
 #[tokio::test]
+#[cfg(feature = "s3_tests")]
 async fn disk_cache_read_empty() {
     let cache_dir = tempfile::tempdir().unwrap();
     let cache_config = DiskDataCacheConfig {
@@ -267,6 +281,7 @@ async fn express_cache_verify_fail_forbidden() {
 }
 
 #[allow(clippy::too_many_arguments)]
+#[cfg(feature = "s3_tests")]
 fn cache_write_read_base<Cache>(
     client: S3CrtClient,
     s3_path: S3Path,
@@ -307,6 +322,7 @@ fn cache_write_read_base<Cache>(
     );
 }
 
+#[cfg(feature = "s3_tests")]
 async fn cache_read_empty<Cache>(cache: Cache, test_name: &str)
 where
     Cache: DataCache + Send + Sync + 'static,
@@ -389,6 +405,7 @@ fn express_cache_expected_bucket_owner(cache_bucket: String, owner_checked: bool
 }
 
 /// Generates random data of the specified size
+#[cfg(feature = "s3_tests")]
 fn random_binary_data(size_in_bytes: usize) -> Vec<u8> {
     let seed = rand::rng().random();
     let mut rng = SmallRng::seed_from_u64(seed);
@@ -399,6 +416,7 @@ fn random_binary_data(size_in_bytes: usize) -> Vec<u8> {
 
 /// Creates a random key which has a size of at least `min_size_in_bytes`
 /// The `key_prefix` is not included in the return value.
+#[cfg(feature = "s3_tests")]
 fn get_random_key(key_prefix: &str, key_suffix: &str, min_size_in_bytes: usize) -> String {
     let random_suffix: u64 = rand::rng().random();
     let last_key_part = format!("{key_suffix}{random_suffix}"); // part of the key after all the "/"
@@ -409,6 +427,7 @@ fn get_random_key(key_prefix: &str, key_suffix: &str, min_size_in_bytes: usize)
     format!("{last_key_part}{padding}")
 }
 
+#[cfg(feature = "s3_tests")]
 fn mount_bucket<Cache>(client: S3CrtClient, cache: Cache, pool: PagedPool, s3_path: S3Path) -> (TempDir, FuseSession)
 where
     Cache: DataCache + Send + Sync + 'static,
@@ -428,6 +447,7 @@ where
     (mount_point, session)
 }
 
+#[cfg(feature = "s3_tests")]
 fn get_object_id(prefix: &str, key: &str, etag: &str) -> ObjectId {
     ObjectId::new(format!("{prefix}{key}"), etag.into())
 }
@@ -437,3 +457,199 @@ fn get_express_cache_block_key(bucket: &str, cache_key: &ObjectId, block_idx: Bl
     let block_key_prefix = build_prefix(bucket, CACHE_BLOCK_SIZE);
     get_s3_key(&block_key_prefix, cache_key, block_idx)
 }
+
+/// Returns `(total_bytes, available_bytes)` for the filesystem containing `path`.
+///
+/// `statvfs` reports its block counts in units of the fragment size (`f_frsize`), not the
+/// preferred I/O block size (`f_bsize`), so the fragment size is used to convert counts to bytes.
+/// The available figure is based on `blocks_available()`, i.e. it does not include blocks
+/// reserved by the filesystem.
+///
+/// # Panics
+///
+/// Panics if `statvfs` fails for `path`.
+fn get_filesystem_stats(path: &Path) -> (u64, u64) {
+    let stat = nix::sys::statvfs::statvfs(path).expect("Failed to get filesystem stats");
+    let fragment_size = stat.fragment_size();
+    (stat.blocks() * fragment_size, stat.blocks_available() * fragment_size)
+}
+
+/// Test that the cache respects the available space limit (default 5% available) during sequential reads.
+///
+/// An isolated loop device filesystem is used for the cache, ensuring Mountpoint evaluates the limit
+/// against the isolated filesystem, not the entire host. The total amount of data read
+/// (`NUM_FILES * FILE_SIZE`) intentionally exceeds the device size so that eviction has to happen.
+///
+/// Note: requires `sudo` for loop device mount/umount operations.
+#[test]
+fn available_space_cache_limit_test_mock() {
+    const FILE_SIZE: usize = 4 * 1024 * 1024; // 4 MiB per file
+    const NUM_FILES: usize = 50; // 50 files = 200 MiB total data
+    const TOLERANCE_RATIO: f64 = 0.02; // 2% tolerance for filesystem metadata overhead
+    const LOOP_DEVICE_SIZE_MIB: u64 = 128; // 128 MiB loop device - total data (200 MiB) intentionally exceeds this
+
+    // Declared before the session so that it is dropped (and unmounted) after the session.
+    let loop_fs = LoopDeviceFilesystem::new(LOOP_DEVICE_SIZE_MIB).expect("Failed to create loop device filesystem");
+    let cache_path = loop_fs.mount_path().to_path_buf();
+
+    let test_session = fuse::mock_session::new_with_cache(|block_size, pool| {
+        let cache_config = DiskDataCacheConfig {
+            cache_directory: cache_path.clone(),
+            block_size,
+            limit: CacheLimit::AvailableSpace {
+                min_ratio: DEFAULT_CACHE_MIN_AVAILABLE_RATIO,
+            },
+        };
+        CacheTestWrapper::new(DiskDataCache::new(cache_config, pool))
+    })("available_space_cache_limit_test", TestSessionConfig::default());
+
+    // Create test files. A fixed seed keeps the generated contents reproducible.
+    let mut rng = SmallRng::seed_from_u64(0x12345678);
+    let mut file_data = vec![0u8; FILE_SIZE];
+
+    for i in 0..NUM_FILES {
+        rng.fill_bytes(&mut file_data);
+        let key = format!("file-{}.bin", i + 1);
+        test_session.client().put_object(&key, &file_data).unwrap();
+    }
+
+    let (total_space, initial_available) = get_filesystem_stats(&cache_path);
+    let mut min_available_space = initial_available;
+    let mut has_violation = false;
+
+    // The thresholds depend only on the total filesystem size, so compute them once up front.
+    // We require at least 5% of the total filesystem to stay available, with a 2% tolerance.
+    // This margin is necessary because Mountpoint currently slightly exceeds the limit occasionally.
+    let tolerance = (total_space as f64 * TOLERANCE_RATIO) as u64;
+    let min_required_available = (total_space as f64 * DEFAULT_CACHE_MIN_AVAILABLE_RATIO) as u64;
+    let violation_threshold = min_required_available.saturating_sub(tolerance);
+
+    // Sequential read pattern - read each file once
+    for i in 0..NUM_FILES {
+        let key = format!("file-{}.bin", i + 1);
+        let path = test_session.mount_path().join(&key);
+
+        let mut file = File::open(&path).unwrap();
+        let mut buffer = Vec::new();
+        file.read_to_end(&mut buffer).unwrap();
+
+        assert_eq!(buffer.len(), FILE_SIZE, "File {} has incorrect size", key);
+
+        // Check filesystem available space
+        let (_, current_available) = get_filesystem_stats(&cache_path);
+        min_available_space = min_available_space.min(current_available);
+
+        let available_ratio = current_available as f64 / total_space as f64;
+        let used_percent = ((total_space - current_available) as f64 / total_space as f64) * 100.0;
+
+        if current_available < violation_threshold {
+            has_violation = true;
+            // Cannot underflow: `current_available` is below `violation_threshold`,
+            // which is itself at most `min_required_available`.
+            let shortage = min_required_available - current_available;
+            let shortage_pct = (shortage as f64 / total_space as f64) * 100.0;
+            warn!(
+                "File {}: Available space {} bytes ({:.1}% used) - BELOW minimum {} bytes (shortage: {} bytes, {:.2}%)",
+                i + 1,
+                current_available,
+                used_percent,
+                min_required_available,
+                shortage,
+                shortage_pct
+            );
+        } else if (i + 1) % 10 == 0 {
+            // Periodic progress output for every tenth file.
+            debug!(
+                "File {}: Used space {} bytes, Available {} bytes ({:.1}% used, {:.1}% free)",
+                i + 1,
+                total_space - current_available,
+                current_available,
+                used_percent,
+                available_ratio * 100.0
+            );
+        }
+    }
+
+    let min_available_space_percent = (min_available_space as f64 / total_space as f64) * 100.0;
+    let (_, final_available) = get_filesystem_stats(&cache_path);
+    let final_used_percent = ((total_space - final_available) as f64 / total_space as f64) * 100.0;
+    info!(
+        "Filesystem Total: {} MiB, Initial available: {} MiB, Min available: {} MiB ({:.1}%), Final usage: {:.1}%",
+        total_space / (1024 * 1024),
+        initial_available / (1024 * 1024),
+        min_available_space / (1024 * 1024),
+        min_available_space_percent,
+        final_used_percent,
+    );
+
+    // Assert that eviction actually triggered - the cache should have gotten close to the limit.
+    let max_expected_available = (total_space as f64 * (DEFAULT_CACHE_MIN_AVAILABLE_RATIO + TOLERANCE_RATIO)) as u64;
+    assert!(
+        min_available_space <= max_expected_available,
+        "Cache eviction may not have triggered - available space never got close to the limit. \
+        Min available: {} bytes ({:.1}%), expected to reach within {:.1}% above the {:.1}% minimum",
+        min_available_space,
+        min_available_space_percent,
+        TOLERANCE_RATIO * 100.0,
+        DEFAULT_CACHE_MIN_AVAILABLE_RATIO * 100.0,
+    );
+
+    // Assert no violations (with the tolerance)
+    assert!(
+        !has_violation,
+        "Cache violated available space limit. Min available: {} bytes ({:.1}%), Required: {:.1}% (tolerance: {:.1}%)",
+        min_available_space,
+        min_available_space_percent,
+        DEFAULT_CACHE_MIN_AVAILABLE_RATIO * 100.0,
+        TOLERANCE_RATIO * 100.0
+    );
+}
+
+/// Represents an isolated loop device filesystem for cache testing.
+///
+/// The filesystem is mounted by [`LoopDeviceFilesystem::new`] and unmounted when the value is dropped.
+struct LoopDeviceFilesystem {
+    mount_path: PathBuf,
+    /// Kept alive to ensure the temp directory is not deleted before `Drop` unmounts the loop device.
+    _temp_dir: tempfile::TempDir,
+}
+
+impl LoopDeviceFilesystem {
+    /// Create a new loop device filesystem with the specified size in MiB.
+    ///
+    /// Creates a sparse image file inside a fresh temporary directory, formats it with `mkfs.ext4`,
+    /// mounts it with `sudo mount -o loop` and then makes the mount point world-writable.
+    ///
+    /// # Errors
+    ///
+    /// Returns an error if a filesystem operation fails, if any of the commands cannot be run,
+    /// or if `mkfs.ext4` or `mount` exit unsuccessfully. An unsuccessful `chmod` exit status is
+    /// only logged as a warning.
+    fn new(size_mib: u64) -> std::io::Result<Self> {
+        let temp_dir = tempfile::tempdir()?;
+        let image_path = temp_dir.path().join("cache-device.img");
+        let mount_path = temp_dir.path().join("cache-mount");
+
+        fs::create_dir_all(&mount_path)?;
+
+        // Create a sparse file for the loop device
+        let file = File::create(&image_path)?;
+        file.set_len(size_mib * 1024 * 1024)?;
+        drop(file);
+
+        // Create ext4 filesystem on the image
+        let output = Command::new("mkfs.ext4").arg("-F").arg(&image_path).output()?;
+        if !output.status.success() {
+            return Err(std::io::Error::other(format!(
+                "mkfs.ext4 failed: {}",
+                String::from_utf8_lossy(&output.stderr)
+            )));
+        }
+
+        let output = Command::new("sudo")
+            .args(["mount", "-o", "loop"])
+            .arg(&image_path)
+            .arg(&mount_path)
+            .output()?;
+        if !output.status.success() {
+            return Err(std::io::Error::other(format!(
+                "mount failed: {}",
+                String::from_utf8_lossy(&output.stderr)
+            )));
+        }
+
+        // The filesystem is mounted from here on: build the guard first so that `Drop` unmounts it
+        // even if a later step returns early with an error.
+        let loop_fs = Self {
+            mount_path,
+            _temp_dir: temp_dir,
+        };
+
+        // Make the mount point writable
+        let output = Command::new("sudo")
+            .args(["chmod", "777"])
+            .arg(&loop_fs.mount_path)
+            .output()?;
+        if !output.status.success() {
+            warn!("chmod failed: {}", String::from_utf8_lossy(&output.stderr));
+        }
+
+        Ok(loop_fs)
+    }
+
+    /// Get the mount path for the loop device
+    fn mount_path(&self) -> &Path {
+        &self.mount_path
+    }
+}
+
+impl Drop for LoopDeviceFilesystem {
+    /// Unmounts the loop device on a best-effort basis.
+    ///
+    /// Failures are logged rather than propagated, since `drop` must not panic during test teardown.
+    fn drop(&mut self) {
+        match Command::new("sudo").arg("umount").arg(&self.mount_path).output() {
+            Ok(output) if output.status.success() => {}
+            Ok(output) => warn!(
+                "umount of {} failed: {}",
+                self.mount_path.display(),
+                String::from_utf8_lossy(&output.stderr)
+            ),
+            Err(err) => warn!("failed to run umount for {}: {}", self.mount_path.display(), err),
+        }
+    }
+}
diff --git a/mountpoint-s3-fs/tests/fuse_tests/mod.rs b/mountpoint-s3-fs/tests/fuse_tests/mod.rs
@@ -1,4 +1,3 @@
-#[cfg(feature = "s3_tests")]
 mod cache_test;
 mod consistency_test;
 #[cfg(all(feature = "manifest", feature = "event_log"))]
diff --git a/mountpoint-s3/CHANGELOG.md b/mountpoint-s3/CHANGELOG.md
@@ -1,6 +1,7 @@
 ## Unreleased (v1.22.1)
 
 * Upgrade cargo dependencies.
+* Fix incorrect validation of the default data cache limit, which could cause Mountpoint to preserve less than 5% of the cache file system's space as available space ([#1779](https://github.com/awslabs/mountpoint-s3/pull/1779))
 
 ## v1.22.0 (January 22, 2026)
 

Original file line number	Diff line number	Diff line change
`@@ -62,9 +62,15 @@ pub enum CacheLimit {`
`62`	`62`	`AvailableSpace { min_ratio: f64 },`
`63`	`63`	`}`
`64`	`64`
	`65`	`+/// Default minimum ratio of available space to preserve when using AvailableSpace cache limit.`
	`66`	`+/// This preserves 5% of the filesystem's total space as available space.`
	`67`	`+pub const DEFAULT_CACHE_MIN_AVAILABLE_RATIO: f64 = 0.05;`
	`68`	`+`
`65`	`69`	`impl Default for CacheLimit {`
`66`	`70`	`fn default() -> Self {`
`67`		`- CacheLimit::AvailableSpace { min_ratio: 0.05 } // Preserve 5% available space`
	`71`	`+ CacheLimit::AvailableSpace {`
	`72`	`+ min_ratio: DEFAULT_CACHE_MIN_AVAILABLE_RATIO,`
	`73`	`+ }`
`68`	`74`	`}`
`69`	`75`	`}`
`70`	`76`
`@@ -407,7 +413,7 @@ impl DiskDataCache {`
`407`	`413`	`return false;`
`408`	`414`	`}`
`409`	`415`	`};`
`410`		`- (stats.blocks_free() as f64) < min_ratio * (stats.blocks() as f64)`
	`416`	`+ (stats.blocks_available() as f64) < min_ratio * (stats.blocks() as f64)`
`411`	`417`	`}`
`412`	`418`	`}`
`413`	`419`	`}`
Original file line number	Diff line number	Diff line change
`@@ -1,4 +1,3 @@`
`1`		`-#[cfg(feature = "s3_tests")]`
`2`	`1`	`mod cache_test;`
`3`	`2`	`mod consistency_test;`
`4`	`3`	`#[cfg(all(feature = "manifest", feature = "event_log"))]`