feat!: use Arinae as default algorithm

LoricAndre · LoricAndre · commit 5b0323a9fb54 · 2026-03-10T15:59:59.000+01:00
=== Results: ./target/release/sk [baseline] ===
Completed runs: 50 / 50
Average items matched: 2895782 / 10000000  (min: 2895782, max: 2895782)
Average time: 3.827s  (min: 3.576s, max: 4.090s)
Average items/second: 2615767  (min: 2445033, max: 2796365)
Average peak memory usage: 1589.2 MB  (min: 1518.6 MB, max: 1661.2 MB)
Average peak CPU usage: 528.9%  (min: 457.0%, max: 740.0%)

=== Results: /home/loric/.local/share/cargo/bin/sk ===
Completed runs: 50 / 50
Average items matched: 2895782 / 10000000  (min: 2895782, max: 2895782)  +0.0%
Average time: 3.930s  (min: 3.565s, max: 4.226s)  +2.7%
Average items/second: 2548674  (min: 2366263, max: 2804816)  -2.6%
Average peak memory usage: 1618.8 MB  (min: 1539.1 MB, max: 1680.6 MB)  +1.9%
Average peak CPU usage: 696.8%  (min: 608.0%, max: 875.0%)  +31.7%

=== Results: /home/loric/.nix-profile/bin/fzf ===
Completed runs: 50 / 50
Average items matched: 2895782 / 10000000  (min: 2895782, max: 2895782)  +0.0%
Average time: 5.421s  (min: 4.814s, max: 6.111s)  +41.7%
Average items/second: 1848269  (min: 1636444, max: 2077385)  -29.3%
Average peak memory usage: 2015.3 MB  (min: 1860.7 MB, max: 2173.9 MB)  +26.8%
Average peak CPU usage: 1301.1%  (min: 1229.0%, max: 1431.0%)  +146.0%

=== Comparison Summary (vs baseline: ./target/release/sk) ===
Binary                                       Avg time     Δ time       Avg rate     Δ rate
------------------------------------------------------------------------------------------
./target/release/sk                            3.827s   baseline        2615767   baseline
/home/loric/.local/share/cargo/bin/sk          3.930s      +2.7%        2548674      -2.6%
/home/loric/.nix-profile/bin/fzf               5.421s     +41.7%        1848269     -29.3%
diff --git a/src/engine/fuzzy.rs b/src/engine/fuzzy.rs
@@ -17,19 +17,17 @@ use crate::{MatchRange, MatchResult, SkimItem};
 #[cfg_attr(feature = "cli", derive(clap::ValueEnum))]
 #[cfg_attr(feature = "cli", clap(rename_all = "snake_case"))]
 pub enum FuzzyAlgorithm {
-    /// Original skim fuzzy matching algorithm (v1)
-    SkimV1,
-    /// Improved skim fuzzy matching algorithm (v2, default)
-    #[default]
+    /// Improved skim fuzzy matching algorithm (v2)
     SkimV2,
     /// Clangd fuzzy matching algorithm
     Clangd,
     /// Fzy matching algorithm (https://github.com/jhawthorn/fzy)
     Fzy,
     /// Frizbee matching algorithm, typo resistant
     Frizbee,
-    /// Arinae: typo-resistant & natural algorithm
+    /// Arinae: typo-resistant & natural algorithm, default
     #[cfg_attr(feature = "cli", clap(alias = "ari"))]
+    #[default]
     Arinae,
 }
 
@@ -107,15 +105,10 @@ impl FuzzyEngineBuilder {
 
     #[allow(deprecated)]
     pub fn build(self) -> FuzzyEngine {
-        use crate::fuzzy_matcher::skim::SkimMatcher;
         #[allow(unused_mut)]
         let mut algorithm = self.algorithm;
         let max_typos = self.effective_max_typos();
         let matcher: Box<dyn FuzzyMatcher> = match algorithm {
-            FuzzyAlgorithm::SkimV1 => {
-                debug!("Initialized SkimV1 algorithm");
-                Box::new(SkimMatcher::default())
-            }
             FuzzyAlgorithm::SkimV2 => {
                 let matcher = SkimMatcherV2::default().element_limit(BYTES_1M);
                 let matcher = match self.case {
diff --git a/src/fuzzy_matcher/arinae/atom.rs b/src/fuzzy_matcher/arinae/atom.rs
@@ -85,6 +85,6 @@ impl Atom for char {
     }
     #[inline(always)]
     fn is_lowercase(self) -> bool {
-        self.is_ascii_lowercase()
+        self.is_lowercase()
     }
 }
diff --git a/src/fuzzy_matcher/skim.rs b/src/fuzzy_matcher/skim.rs
@@ -26,243 +26,6 @@ use super::skim::Movement::{Match, Skip};
 use super::util::{char_equal, cheap_matches};
 use super::{FuzzyMatcher, IndexType, MatchIndices, ScoreType};
 
-const BONUS_MATCHED: ScoreType = 4;
-const BONUS_CASE_MATCH: ScoreType = 4;
-const BONUS_UPPER_MATCH: ScoreType = 6;
-const BONUS_ADJACENCY: ScoreType = 10;
-const BONUS_SEPARATOR: ScoreType = 8;
-const BONUS_CAMEL: ScoreType = 8;
-const PENALTY_CASE_UNMATCHED: ScoreType = -1;
-const PENALTY_LEADING: ScoreType = -6;
-// penalty applied for every letter before the first match
-const PENALTY_MAX_LEADING: ScoreType = -18;
-// maxing penalty for leading letters
-const PENALTY_UNMATCHED: ScoreType = -2;
-
-#[deprecated(since = "0.3.5", note = "Please use SkimMatcherV2 instead")]
-/// Legacy fuzzy matcher (V1) - deprecated, use SkimMatcherV2 instead
-#[derive(Default, Debug)]
-pub struct SkimMatcher {}
-
-/// The V1 matcher is based on ForrestTheWoods's post
-/// https://www.forrestthewoods.com/blog/reverse_engineering_sublime_texts_fuzzy_match/
-///
-/// V1 algorithm is deprecated, checkout `FuzzyMatcherV2`
-impl FuzzyMatcher for SkimMatcher {
-    fn fuzzy_indices(&self, choice: &str, pattern: &str) -> Option<(ScoreType, MatchIndices)> {
-        fuzzy_indices(choice, pattern).map(|(s, v)| (s, MatchIndices::from(v)))
-    }
-
-    fn fuzzy_match(&self, choice: &str, pattern: &str) -> Option<ScoreType> {
-        fuzzy_match(choice, pattern)
-    }
-}
-
-#[deprecated(since = "0.3.5", note = "Please use SkimMatcherV2 instead")]
-/// Legacy fuzzy matching function - returns match score only
-pub fn fuzzy_match(choice: &str, pattern: &str) -> Option<ScoreType> {
-    if pattern.is_empty() {
-        return Some(0);
-    }
-
-    let scores = build_graph(choice, pattern)?;
-
-    let last_row = &scores[scores.len() - 1];
-    let (_, &MatchingStatus { final_score, .. }) = last_row
-        .iter()
-        .enumerate()
-        .max_by_key(|&(_, x)| x.final_score)
-        .expect("fuzzy_indices failed to iterate over last_row");
-    Some(final_score)
-}
-
-#[deprecated(since = "0.3.5", note = "Please use SkimMatcherV2 instead")]
-/// Legacy fuzzy matching function - returns match score and character indices
-pub fn fuzzy_indices(choice: &str, pattern: &str) -> Option<(ScoreType, Vec<IndexType>)> {
-    if pattern.is_empty() {
-        return Some((0, Vec::new()));
-    }
-
-    let mut picked = vec![];
-    let scores = build_graph(choice, pattern)?;
-
-    let last_row = &scores[scores.len() - 1];
-    let (mut next_col, &MatchingStatus { final_score, .. }) = last_row
-        .iter()
-        .enumerate()
-        .max_by_key(|&(_, x)| x.final_score)
-        .expect("fuzzy_indices failed to iterate over last_row");
-    let mut pat_idx = scores.len() as i64 - 1;
-    while pat_idx >= 0 {
-        let status = scores[pat_idx as usize][next_col];
-        next_col = status.back_ref as usize;
-        picked.push(status.idx);
-        pat_idx -= 1;
-    }
-    picked.reverse();
-    Some((final_score, picked))
-}
-
-#[derive(Clone, Copy, Debug)]
-struct MatchingStatus {
-    pub idx: IndexType,
-    pub score: ScoreType,
-    pub final_score: ScoreType,
-    pub adj_num: IndexType,
-    pub back_ref: IndexType,
-}
-
-impl Default for MatchingStatus {
-    fn default() -> Self {
-        MatchingStatus {
-            idx: 0,
-            score: 0,
-            final_score: 0,
-            adj_num: 1,
-            back_ref: 0,
-        }
-    }
-}
-
-fn build_graph(choice: &str, pattern: &str) -> Option<Vec<Vec<MatchingStatus>>> {
-    let mut scores = vec![];
-
-    let mut match_start_idx = 0; // to ensure that the pushed char are able to match the pattern
-    let mut pat_prev_ch = '\0';
-
-    // initialize the match positions and inline scores
-    for (pat_idx, pat_ch) in pattern.chars().enumerate() {
-        let mut vec = vec![];
-        let mut choice_prev_ch = '\0';
-        for (idx, ch) in choice.chars().enumerate() {
-            if char_equal(ch, pat_ch, false) && idx >= match_start_idx {
-                let score = fuzzy_score(
-                    ch,
-                    idx as IndexType,
-                    choice_prev_ch,
-                    pat_ch,
-                    pat_idx as IndexType,
-                    pat_prev_ch,
-                );
-                vec.push(MatchingStatus {
-                    idx: idx as IndexType,
-                    score,
-                    final_score: score,
-                    adj_num: 1,
-                    back_ref: 0,
-                });
-            }
-            choice_prev_ch = ch;
-        }
-
-        if vec.is_empty() {
-            // not matched
-            return None;
-        }
-        match_start_idx = vec[0].idx + 1;
-        scores.push(vec);
-        pat_prev_ch = pat_ch;
-    }
-
-    // calculate max scores considering adjacent characters
-    for pat_idx in 1..scores.len() {
-        let (first_half, last_half) = scores.split_at_mut(pat_idx);
-
-        let prev_row = &first_half[first_half.len() - 1];
-        let cur_row = &mut last_half[0];
-
-        for idx in 0..cur_row.len() {
-            let next = cur_row[idx];
-            let prev = if idx > 0 {
-                cur_row[idx - 1]
-            } else {
-                MatchingStatus::default()
-            };
-
-            let mut score_before_idx = prev.final_score - prev.score + next.score;
-            score_before_idx += PENALTY_UNMATCHED * ((next.idx - prev.idx) as ScoreType);
-            score_before_idx -= if prev.adj_num == 0 { BONUS_ADJACENCY } else { 0 };
-
-            let (back_ref, score, adj_num) = prev_row
-                .iter()
-                .enumerate()
-                .take_while(|&(_, &MatchingStatus { idx, .. })| idx < next.idx)
-                .skip_while(|&(_, &MatchingStatus { idx, .. })| idx < prev.idx)
-                .map(|(back_ref, cur)| {
-                    let adj_num = next.idx - cur.idx - 1;
-                    let mut final_score = cur.final_score + next.score;
-                    final_score += if adj_num == 0 {
-                        BONUS_ADJACENCY
-                    } else {
-                        PENALTY_UNMATCHED * adj_num as ScoreType
-                    };
-                    (back_ref, final_score, adj_num)
-                })
-                .max_by_key(|&(_, x, _)| x)
-                .unwrap_or((prev.back_ref, score_before_idx, prev.adj_num));
-
-            cur_row[idx] = if idx > 0 && score < score_before_idx {
-                MatchingStatus {
-                    final_score: score_before_idx,
-                    back_ref: prev.back_ref,
-                    adj_num,
-                    ..next
-                }
-            } else {
-                MatchingStatus {
-                    final_score: score,
-                    back_ref: back_ref as IndexType,
-                    adj_num,
-                    ..next
-                }
-            };
-        }
-    }
-
-    Some(scores)
-}
-
-// judge how many scores the current index should get
-fn fuzzy_score(
-    choice_ch: char,
-    choice_idx: IndexType,
-    choice_prev_ch: char,
-    pat_ch: char,
-    pat_idx: IndexType,
-    _pat_prev_ch: char,
-) -> ScoreType {
-    let mut score = BONUS_MATCHED;
-
-    let choice_prev_ch_type = CharType::of(choice_prev_ch);
-    let choice_role = CharRole::of(choice_prev_ch, choice_ch);
-
-    if pat_ch == choice_ch {
-        if pat_ch.is_uppercase() {
-            score += BONUS_UPPER_MATCH;
-        } else {
-            score += BONUS_CASE_MATCH;
-        }
-    } else {
-        score += PENALTY_CASE_UNMATCHED;
-    }
-
-    // apply bonus for camelCases
-    if choice_role == CharRole::Head || choice_role == CharRole::Break || choice_role == CharRole::Camel {
-        score += BONUS_CAMEL;
-    }
-
-    // apply bonus for matches after a separator
-    if choice_prev_ch_type == CharType::HardSep || choice_prev_ch_type == CharType::SoftSep {
-        score += BONUS_SEPARATOR;
-    }
-
-    if pat_idx == 0 {
-        score += max((choice_idx as ScoreType) * PENALTY_LEADING, PENALTY_MAX_LEADING);
-    }
-
-    score
-}
-
 #[derive(Copy, Clone, Debug)]
 /// Configuration for skim's scoring algorithm
 pub struct SkimScoreConfig {
@@ -520,9 +283,6 @@ enum CharRole {
 }
 
 impl CharRole {
-    pub fn of(prev: char, cur: char) -> Self {
-        Self::of_type(CharType::of(prev), CharType::of(cur))
-    }
     pub fn of_type(prev: CharType, cur: CharType) -> Self {
         match (prev, cur) {
             (CharType::Empty, _) | (CharType::HardSep, _) => CharRole::Head,
diff --git a/src/options.rs b/src/options.rs
@@ -175,16 +175,16 @@ pub struct SkimOptions {
 
     /// Fuzzy matching algorithm
     ///
-    /// skim_v2 Latest skim algorithm, should be better in almost any case
-    /// skim_v1 Legacy skim algorithm
+    /// arinae (ari) Latest algorithm
+    /// skim_v2 Legacy skim algorithm
     /// clangd  Used in clangd for keyword completion
     /// fzy     Algorithm from fzy (https://github.com/jhawthorn/fzy)
     #[cfg_attr(
         feature = "cli",
         arg(
             long = "algo",
-            default_value = "skim_v2",
             value_enum,
+            default_value = "arinae",
             help_heading = "Search",
             verbatim_doc_comment
         )
diff --git a/tests/matcher.rs b/tests/matcher.rs
@@ -61,27 +61,24 @@ insta_test!(matcher_default, INPUT_ITEMS, &["-q", "stum"], {
 insta_test!(matcher_skim_v2, INPUT_ITEMS, &["-q", "stum", "--algo", "skim_v2"], {
     @snap;
 });
-insta_test!(matcher_skim_v1, INPUT_ITEMS, &["-q", "stum", "--algo", "skim_v1"], {
-    @snap;
-});
 insta_test!(matcher_clangd, INPUT_ITEMS, &["-q", "stum", "--algo", "clangd"], {
     @snap;
 });
 insta_test!(matcher_frizbee, INPUT_ITEMS, &["-q", "stum", "--algo", "frizbee", "--no-typos"], {
     @snap;
 });
-insta_test!(matcher_frizbee_typos, INPUT_ITEMS, &["-q", "stum", "--algo", "frizbee"], {
+insta_test!(matcher_frizbee_typos, INPUT_ITEMS, &["-q", "stum", "--algo", "frizbee", "--typos"], {
     @snap;
 });
 insta_test!(matcher_fzy, INPUT_ITEMS, &["-q", "stum", "--algo", "fzy", "--no-typos"], {
     @snap;
 });
-insta_test!(matcher_fzy_typos, INPUT_ITEMS, &["-q", "stum", "--algo", "fzy"], {
+insta_test!(matcher_fzy_typos, INPUT_ITEMS, &["-q", "stum", "--algo", "fzy", "--typos"], {
     @snap;
 });
 insta_test!(matcher_arinae, INPUT_ITEMS, &["-q", "stum", "--algo", "arinae", "--no-typos"], {
     @snap;
 });
-insta_test!(matcher_arinae_typos, INPUT_ITEMS, &["-q", "stum", "--algo", "arinae"], {
+insta_test!(matcher_arinae_typos, INPUT_ITEMS, &["-q", "stum", "--algo", "arinae", "--typos"], {
     @snap;
 });
diff --git a/tests/snapshots/normalize__insta_normalize_case_insensitive-2.snap b/tests/snapshots/normalize__insta_normalize_case_insensitive-2.snap
@@ -20,10 +20,10 @@ expression: buf + & cursor_pos
 "                                                                                "
 "                                                                                "
 "                                                                                "
-"  CAFE                                                                          "
-"  Café                                                                          "
 "  cafe                                                                          "
-"> café                                                                          "
+"  café                                                                          "
+"  CAFE                                                                          "
+"> Café                                                                          "
 "  4/4                                                                        0/0"
 "> cafe                                                                          "
 cursor: (24, 7)
diff --git a/tests/snapshots/tiebreak__tiebreak_neg_pathname-2.snap b/tests/snapshots/tiebreak__tiebreak_neg_pathname-2.snap
@@ -21,8 +21,8 @@ expression: buf + & cursor_pos
 "                                                                                "
 "                                                                                "
 "                                                                                "
-"  baz/foo                                                                       "
 "  foo                                                                           "
+"  baz/foo                                                                       "
 "> foo/bar                                                                       "
 "  3/3                                                                        0/0"
 "> foo                                                                           "
diff --git a/tests/snapshots/tiebreak__tiebreak_pathname-2.snap b/tests/snapshots/tiebreak__tiebreak_pathname-2.snap
@@ -22,8 +22,8 @@ expression: buf + & cursor_pos
 "                                                                                "
 "                                                                                "
 "  foo/bar                                                                       "
-"  baz/foo                                                                       "
-"> foo                                                                           "
+"  foo                                                                           "
+"> baz/foo                                                                       "
 "  3/3                                                                        0/0"
 "> foo                                                                           "
 cursor: (24, 6)
diff --git a/tests/unix.rs b/tests/unix.rs

Original file line number	Diff line number	Diff line change
`@@ -85,6 +85,6 @@ impl Atom for char {`
`85`	`85`	`}`
`86`	`86`	`#[inline(always)]`
`87`	`87`	`fn is_lowercase(self) -> bool {`
`88`		`- self.is_ascii_lowercase()`
	`88`	`+ self.is_lowercase()`
`89`	`89`	`}`
`90`	`90`	`}`