Commit a12c256

test(core): quality audit — 18 new tests, fix stale docs, harden .gitignore
Add 18 new tests covering previously untested paths:
- Config validation edge cases (9 should_panic tests for all validate() branches)
- Block boundary matrix tests across 3 configurations (block/full AttnRes)
- Block accumulation count verification through full forward pass
- Numerical stability: large magnitude, near-zero, and zero inputs
- RMSNorm zero-input safety (eps prevents NaN)
- Two-phase stress tests: deep model (24 sublayers) and Full AttnRes mode
- Property tests: identical-source identity, output finiteness

Fix stale documentation:
- README: update from v0.1.0/57 tests to v0.2.0/84 tests, remove false "no serialization" claim, add actual current limitations
- AGENTS.md: fix incorrect "SwiGLU-style MLP" → "GELU activation"
- ROADMAP.md: update current phase from v0.1.0 to v0.2.0

Harden .gitignore with IDE files, OS files, model checkpoint artifacts.

84 tests passing. Clippy clean. Fmt clean.

https://claude.ai/code/session_017JX3N9cDig1WYJG5P1rdVy
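The RMSNorm zero-input case covered by the new stability tests can be illustrated with a plain-Rust sketch. This is not the crate's burn-based implementation; the function name and eps value are illustrative. The point is that the eps term inside the square root keeps the divisor nonzero when every input element is zero:

```rust
// Standalone sketch of why RMSNorm's eps term prevents NaN on an all-zero
// input. Uses plain f32 slices rather than burn tensors.
fn rms_norm(x: &[f32], eps: f32) -> Vec<f32> {
    let mean_sq = x.iter().map(|v| v * v).sum::<f32>() / x.len() as f32;
    let scale = 1.0 / (mean_sq + eps).sqrt(); // eps keeps the divisor nonzero
    x.iter().map(|v| v * scale).collect()
}

fn main() {
    let zeros = vec![0.0_f32; 8];
    let out = rms_norm(&zeros, 1e-6);
    // Without eps this would be 0 / sqrt(0) = NaN; with eps every element
    // stays finite (and is exactly 0).
    assert!(out.iter().all(|v| v.is_finite()));
}
```

With `eps = 0.0` the same call would divide zero by zero and propagate NaN through every downstream layer, which is exactly what the new zero-input test guards against.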
1 parent a744d1b commit a12c256

6 files changed: 340 additions & 14 deletions

.gitignore

Lines changed: 19 additions & 6 deletions
```diff
@@ -17,9 +17,22 @@ target
 # Contains mutation testing data
 **/mutants.out*/
 
-# RustRover
-# JetBrains specific template is maintained in a separate JetBrains.gitignore that can
-# be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
-# and can be added to the global gitignore or merged into this file. For a more nuclear
-# option (not recommended) you can uncomment the following to ignore the entire idea folder.
-#.idea/
+# IDE / Editor files
+.idea/
+.vscode/
+*.swp
+*.swo
+*~
+
+# OS files
+.DS_Store
+Thumbs.db
+
+# Model checkpoint artifacts
+*.mpk
+*.bin
+*.onnx
+*.safetensors
+
+# Criterion benchmark output
+target/criterion/
```
AGENTS.md

Lines changed: 2 additions & 2 deletions
````diff
@@ -29,7 +29,7 @@ src/
 ├── serialization.rs # Model weight save/load (NamedMpk, binary, compact formats)
 ├── two_phase.rs # Two-phase inference primitives (phase1_batched, online_softmax_merge)
 ├── attention.rs # Multi-head self-attention
-├── feed_forward.rs # SwiGLU-style MLP
+├── feed_forward.rs # Two-layer MLP with GELU activation
 └── utils.rs # Causal mask generation helpers
 
 tests/
@@ -55,7 +55,7 @@ fixtures/ # Reference outputs from PyTorch
 
 ```bash
 cargo build # Build the project
-cargo test --all-features # Run all 66 tests
+cargo test --all-features # Run all 84 tests
 cargo test test_name # Run specific test
 cargo clippy -- -D warnings # Lint (warnings = errors)
 cargo fmt # Format code
````

README.md

Lines changed: 3 additions & 3 deletions
```diff
@@ -83,13 +83,13 @@ cargo bench # Benchmarks
 
 ## Current Status
 
-**Alpha** (v0.1.0). Core algorithm implemented and tested with 57 passing tests (unit, differential, property-based, integration). Built on burn 0.20. Suitable for research and experimentation. Not yet suitable for production training at scale.
+**Alpha** (v0.2.0). Core algorithm implemented and tested with 84 passing tests (unit, differential, property-based, integration, doctest). Built on burn 0.20. Serialization (NamedMpk, binary, compact/half-precision) and two-phase inference integrated. Suitable for research and experimentation. Not yet suitable for production training at scale.
 
 Known limitations:
-- No weight serialization/loading (safetensors support planned)
-- Two-phase inference optimization is implemented but not integrated into the main forward pass
+- No PyTorch checkpoint import (safetensors format)
 - NdArray backend only tested; GPU backends (wgpu, CUDA, Metal) untested
 - No distributed training support
+- No KV-cache for autoregressive generation
 
 See [ROADMAP.md](ROADMAP.md) for planned features and progress.
```

ROADMAP.md

Lines changed: 3 additions & 3 deletions
```diff
@@ -1,8 +1,8 @@
 # attnres-rs Roadmap
 
-## Current Phase: Alpha (v0.1.0)
+## Current Phase: Alpha (v0.2.0)
 
-Core algorithm implemented and tested. Suitable for research and experimentation.
+Core algorithm, serialization, and two-phase inference implemented. 84 tests passing. Suitable for research and experimentation.
 
 ---
 
@@ -29,7 +29,7 @@ Core algorithm implemented and tested. Suitable for research and experimentation
 - [x] Config save/load (JSON via burn's Config trait)
 - [x] Integrate two-phase inference into main `forward_two_phase` method
 - [x] Layer accessor methods for two-phase inference components
-- [x] 66 tests passing (unit, differential, property-based, integration, doctest)
+- [x] 84 tests passing (unit, differential, property-based, integration, doctest)
 - [ ] Pre-trained weight loading from PyTorch checkpoints
 - [ ] Model export utilities
```
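The two-phase inference items above rest on the `online_softmax_merge` primitive listed in the `src/` tree. A scalar-valued sketch of the underlying idea, assuming flash-attention-style running (max, normalizer, accumulator) triples; all names here are illustrative, not the crate's API:

```rust
// Partial softmax-weighted reduction over a slice of scores/values.
// `m` is the running max, `l` the normalizer sum(exp(s - m)), and `acc`
// the weighted value sum(exp(s - m) * v). Scalar values for brevity.
struct Partial {
    m: f32,
    l: f32,
    acc: f32,
}

// Merge two partials into one, rescaling each side to the shared max.
// This lets phase 1 process blocks independently and combine them later.
fn merge(a: &Partial, b: &Partial) -> Partial {
    let m = a.m.max(b.m);
    let (wa, wb) = ((a.m - m).exp(), (b.m - m).exp());
    Partial {
        m,
        l: a.l * wa + b.l * wb,
        acc: a.acc * wa + b.acc * wb,
    }
}

// One-pass reference computation over a whole slice.
fn partial(scores: &[f32], values: &[f32]) -> Partial {
    let m = scores.iter().cloned().fold(f32::NEG_INFINITY, f32::max);
    let l = scores.iter().map(|s| (s - m).exp()).sum();
    let acc = scores
        .iter()
        .zip(values)
        .map(|(s, v)| (s - m).exp() * v)
        .sum();
    Partial { m, l, acc }
}

fn main() {
    let scores = [1.0_f32, 2.0, 3.0, 4.0];
    let values = [10.0_f32, 20.0, 30.0, 40.0];
    // Merging two halves must equal one pass over the whole sequence.
    let merged = merge(
        &partial(&scores[..2], &values[..2]),
        &partial(&scores[2..], &values[2..]),
    );
    let full = partial(&scores, &values);
    assert!((merged.acc / merged.l - full.acc / full.l).abs() < 1e-5);
}
```

The merge is associative up to floating-point error, which is what makes it safe to split attention over blocks in phase 1 and reduce the partials in any order in phase 2.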

tests/property_tests.rs

Lines changed: 64 additions & 0 deletions
```diff
@@ -102,4 +102,68 @@ proptest! {
         let output = op.forward(&blocks, &partial);
         prop_assert_eq!(output.dims(), [batch, seq_len, d_model]);
     }
+
+    /// Zero-init AttnRes with identical sources should return that source.
+    /// This is the identity property: if all inputs are the same, the output
+    /// must equal that input regardless of num_blocks.
+    #[test]
+    fn identical_sources_produce_identical_output(
+        num_blocks in 1_usize..5,
+        batch in 1_usize..3,
+        seq_len in 1_usize..5,
+    ) {
+        let d_model = 16;
+        let device = Default::default();
+        let config = AttnResConfig::new(d_model, 12, num_blocks);
+        let op = config.init_op::<TestBackend>(&device);
+
+        // All sources are the same tensor
+        let source = Tensor::random(
+            [batch, seq_len, d_model],
+            Distribution::Uniform(-1.0, 1.0),
+            &device,
+        );
+        let blocks: Vec<_> = (0..num_blocks).map(|_| source.clone()).collect();
+
+        let output = op.forward(&blocks, &source);
+        let diff: f32 = (output - source).abs().max().into_scalar();
+        prop_assert!(
+            diff < 1e-3,
+            "Identical sources should produce that source, diff={diff}"
+        );
+    }
+
+    /// AttnRes output should be finite (no NaN/Inf) for any reasonable input.
+    #[test]
+    fn output_is_always_finite(
+        num_blocks in 1_usize..4,
+        batch in 1_usize..3,
+        seq_len in 1_usize..5,
+    ) {
+        let d_model = 16;
+        let device = Default::default();
+        let config = AttnResConfig::new(d_model, 12, num_blocks);
+        let op = config.init_op::<TestBackend>(&device);
+
+        let blocks: Vec<_> = (0..num_blocks)
+            .map(|_| {
+                Tensor::random(
+                    [batch, seq_len, d_model],
+                    Distribution::Uniform(-10.0, 10.0),
+                    &device,
+                )
+            })
+            .collect();
+        let partial = Tensor::random(
+            [batch, seq_len, d_model],
+            Distribution::Uniform(-10.0, 10.0),
+            &device,
+        );
+
+        let output = op.forward(&blocks, &partial);
+        let has_nan: bool = output.clone().is_nan().any().into_scalar();
+        let has_inf: bool = output.is_inf().any().into_scalar();
+        prop_assert!(!has_nan, "Output contains NaN");
+        prop_assert!(!has_inf, "Output contains Inf");
+    }
 }
```
