darkmatter
diff --git a/README.md b/README.md
Lines changed: 1 addition & 1 deletion
diff --git a/apps/native/.storybook/mocks/tauri-runtime.ts b/apps/native/.storybook/mocks/tauri-runtime.ts
Lines changed: 1 addition & 0 deletions
diff --git a/apps/native/src-tauri/src/cli.rs b/apps/native/src-tauri/src/cli.rs
Lines changed: 25 additions & 5 deletions
diff --git a/apps/native/src-tauri/src/commands/ui_prefs.rs b/apps/native/src-tauri/src/commands/ui_prefs.rs
Lines changed: 7 additions & 0 deletions
diff --git a/apps/native/src-tauri/src/evolve/mod.rs b/apps/native/src-tauri/src/evolve/mod.rs
Lines changed: 80 additions & 38 deletions
diff --git a/apps/native/src-tauri/src/main.rs b/apps/native/src-tauri/src/main.rs
Lines changed: 2 additions & 0 deletions
diff --git a/apps/native/src-tauri/src/shared_types/prefs.rs b/apps/native/src-tauri/src/shared_types/prefs.rs
Lines changed: 6 additions & 2 deletions
diff --git a/apps/native/src-tauri/src/storage/store.rs b/apps/native/src-tauri/src/storage/store.rs
Lines changed: 13 additions & 0 deletions
@@ -193,7 +193,7 @@ nixmac evolve "install ripgrep and fd"
 # With options
 nixmac evolve "enable Touch ID for sudo" \
   --config ~/.darwin \
-  --max-iterations 10 \
+  --max-token-budget 50000 \
   --max-output-tokens 32768 \
   --evolve-provider ollama \
   --evolve-model qwen3-coder:30b
 
@@ -59,6 +59,7 @@ const prefs = {
   evolveProvider: "openai",
   evolveModel: "gpt-5",
   maxIterations: 25,
+  maxTokenBudget: 50_000,
   maxBuildAttempts: 3,
   maxOutputTokens: 32768,
   sendDiagnostics: true,
 
@@ -3,7 +3,7 @@
 //! Usage:
 //!   nixmac evolve "your prompt here"
 //!   nixmac evolve "your prompt" --config /path/to/config
-//!   nixmac evolve "your prompt" --max-iterations 5 --host aarch64-darwin
+//!   nixmac evolve "your prompt" --max-token-budget 50000 --host aarch64-darwin
 //!
 //! NOTE NOTE NOTE: If you pass any CLI arguments corresponding to settings that
 //! come from the app store, those CLI arguments will override the store values
@@ -25,6 +25,7 @@ pub struct EvolveConfig {
     pub config: Option<PathBuf>,
     pub max_iterations: Option<usize>,
     pub max_output_tokens: Option<usize>,
+    pub max_token_budget: Option<u32>,
     pub evolve_provider: Option<String>,
     pub evolve_model: Option<String>,
     pub summary_provider: Option<String>,
@@ -55,14 +56,18 @@ pub enum Commands {
         #[arg(short, long)]
         config: Option<PathBuf>,
 
-        /// Maximum iterations for the evolution
-        #[arg(short, long)]
+        /// Legacy fallback for providers that do not report token usage
+        #[arg(short, long, hide = true)]
         max_iterations: Option<usize>,
 
         /// Maximum output tokens requested per evolution model call
         #[arg(long)]
         max_output_tokens: Option<usize>,
 
+        /// Maximum provider-reported tokens for the evolution
+        #[arg(long)]
+        max_token_budget: Option<u32>,
+
         /// Provider for evolution (e.g., openai, openrouter, ollama)
         #[arg(long)]
         evolve_provider: Option<String>,
@@ -108,6 +113,7 @@ pub async fn handle_evolve_command(app: &AppHandle, cfg: EvolveConfig) -> Result
         config,
         max_iterations,
         max_output_tokens,
+        max_token_budget,
         evolve_provider,
         evolve_model,
         summary_provider,
@@ -192,7 +198,7 @@ pub async fn handle_evolve_command(app: &AppHandle, cfg: EvolveConfig) -> Result
         None => crate::storage::store::get_summary_model(app).ok().flatten(),
     };
 
-    // Effective max iterations: prefer CLI value, otherwise read from store (has default)
+    // Effective legacy iteration fallback: prefer CLI value, otherwise read from store (has default)
     let effective_max_iterations: usize = match max_iterations {
         Some(v) => v,
         None => crate::storage::store::get_max_iterations(app)
@@ -204,7 +210,14 @@ pub async fn handle_evolve_command(app: &AppHandle, cfg: EvolveConfig) -> Result
             .unwrap_or(crate::storage::store::DEFAULT_MAX_OUTPUT_TOKENS),
     };
 
-    // Max iterations
+    // Effective max token budget: prefer CLI value, otherwise read from store (has default)
+    let effective_max_token_budget: u32 = match max_token_budget {
+        Some(v) => v,
+        None => crate::storage::store::get_max_token_budget(app)
+            .unwrap_or(crate::storage::store::DEFAULT_MAX_TOKEN_BUDGET),
+    };
+
+    // Legacy max iterations
     if let Some(iterations) = max_iterations {
         crate::storage::store::set_max_iterations(app, iterations)
             .map_err(|e| format!("Failed to set max iterations: {}", e))?;
@@ -215,6 +228,12 @@ pub async fn handle_evolve_command(app: &AppHandle, cfg: EvolveConfig) -> Result
             .map_err(|e| format!("Failed to set max output tokens: {}", e))?;
     }
 
+    // Max token budget
+    if let Some(token_budget) = max_token_budget {
+        crate::storage::store::set_max_token_budget(app, token_budget)
+            .map_err(|e| format!("Failed to set max token budget: {}", e))?;
+    }
+
     // Host
     if let Some(ref host_attr) = host {
         crate::storage::store::set_host_attr(app, host_attr)
@@ -273,6 +292,7 @@ pub async fn handle_evolve_command(app: &AppHandle, cfg: EvolveConfig) -> Result
             "prompt": prompt,
             "maxIterations": effective_max_iterations,
             "maxOutputTokens": effective_max_output_tokens,
+            "maxTokenBudget": effective_max_token_budget,
             "evolveProvider": effective_evolve_provider,
             "evolveModel": effective_evolve_model,
             "summaryProvider": effective_summary_provider,
 
@@ -29,6 +29,8 @@ pub async fn ui_get_prefs(app: AppHandle) -> Result<shared_types::UiPrefs, Strin
 
     let max_iterations =
         Some(store::get_max_iterations(&app).unwrap_or(store::DEFAULT_MAX_ITERATIONS));
+    let max_token_budget =
+        Some(store::get_max_token_budget(&app).unwrap_or(store::DEFAULT_MAX_TOKEN_BUDGET));
     let max_build_attempts = Some(store::get_max_build_attempts(&app).unwrap_or(5));
     let max_output_tokens =
         Some(store::get_max_output_tokens(&app).unwrap_or(store::DEFAULT_MAX_OUTPUT_TOKENS));
@@ -90,6 +92,7 @@ pub async fn ui_get_prefs(app: AppHandle) -> Result<shared_types::UiPrefs, Strin
         summary_model,
 
         max_iterations,
+        max_token_budget,
         max_build_attempts,
         max_output_tokens,
 
@@ -143,6 +146,10 @@ pub async fn ui_set_prefs(
         store::set_max_iterations(&app, max_iterations)
             .map_err(|e| capture_err("ui_set_prefs", e))?;
     }
+    if let Some(max_token_budget) = prefs.max_token_budget {
+        store::set_max_token_budget(&app, max_token_budget)
+            .map_err(|e| capture_err("ui_set_prefs", e))?;
+    }
     if let Some(max_build_attempts) = prefs.max_build_attempts {
         store::set_max_build_attempts(&app, max_build_attempts)
             .map_err(|e| capture_err("ui_set_prefs", e))?;
 
@@ -327,9 +327,9 @@ fn log_api_error(
 const DEFAULT_MODEL: &str = "anthropic/claude-sonnet-4";
 const DEFAULT_OLLAMA_API_BASE: &str = "http://localhost:11434";
 
-// Percentage of max_iterations after which we require at least one edit/build_check.
-// Example: with max_iterations=50 and this set to 75, threshold is 37 iterations.
-const MAX_ITERATIONS_BEFORE_EDIT_PERCENT: usize = 75;
+// Percentage of the token budget after which we require at least one edit/build_check.
+// Example: with maxTokenBudget=50,000 and this set to 75, threshold is 37,500 tokens.
+const MAX_TOKEN_BUDGET_BEFORE_EDIT_PERCENT: u32 = 75;
 
 // Applied separately to stdout and stderr. So when thinking about tokens,
 // the effective output limit could be up to double this if both are long.
@@ -690,22 +690,26 @@ pub async fn generate_evolution<R: Runtime>(
 
     // Read configurable limits from store (hot-reloaded on every run).
     let config::EvolutionLimits {
-        max_iterations,
         max_build_attempts,
+        ..
     } = config::EvolutionLimits::load(app)
         .inspect_err(|e| warn!("EvolutionLimits::load failed ({e}); using defaults"))
         .unwrap_or_default();
-    let max_iterations_before_edit = std::cmp::max(
+    let legacy_max_iterations =
+        store::get_max_iterations(app).unwrap_or(store::DEFAULT_MAX_ITERATIONS);
+    let max_token_budget =
+        store::get_max_token_budget(app).unwrap_or(store::DEFAULT_MAX_TOKEN_BUDGET);
+    let max_tokens_before_edit = std::cmp::max(
         1,
-        (max_iterations * MAX_ITERATIONS_BEFORE_EDIT_PERCENT) / 100,
+        (max_token_budget as u64 * MAX_TOKEN_BUDGET_BEFORE_EDIT_PERCENT as u64 / 100) as u32, // u64 math: the u32 product overflows past ~57M tokens
     );
     info!(
-        "Limits: max_iterations={}, max_iterations_before_edit={} ({}%), max_build_attempts={}, max_output_tokens={}",
-        max_iterations,
-        max_iterations_before_edit,
-        MAX_ITERATIONS_BEFORE_EDIT_PERCENT,
+        "Limits: max_token_budget={}, max_tokens_before_edit={} ({}%), max_build_attempts={}, legacy_max_iterations={}",
+        max_token_budget,
+        max_tokens_before_edit,
+        MAX_TOKEN_BUDGET_BEFORE_EDIT_PERCENT,
         max_build_attempts,
-        max_output_tokens
+        legacy_max_iterations,
     );
 
     let tools = create_tools(banned_tools);
@@ -719,6 +723,7 @@ pub async fn generate_evolution<R: Runtime>(
     let mut build_attempts: usize = 0;
     let mut build_verified = false;
     let mut total_tokens: u32 = 0;
+    let mut token_usage_observed = false;
     let chat_memory_store = session_chat_memory_store();
 
     // Restore only persisted conversational history (user/assistant, NOT tool)
@@ -923,14 +928,21 @@ pub async fn generate_evolution<R: Runtime>(
 
         // Track token usage
         if let Some(usage) = &response.usage {
-            total_tokens += usage.total;
+            token_usage_observed = true;
+            total_tokens = total_tokens.saturating_add(usage.total);
             info!(
-                "📊 Tokens | this_call: {} (in={}, out={}) | total_session: {}",
-                usage.total, usage.input, usage.output, total_tokens
+                "📊 Tokens | this_call: {} (in={}, out={}) | total_session: {}/{}",
+                usage.total, usage.input, usage.output, total_tokens, max_token_budget
             );
             emit_evolve_event(
                 app,
-                EvolveEvent::api_response(start_time, iteration, usage.total),
+                EvolveEvent::api_response(
+                    start_time,
+                    iteration,
+                    usage.total,
+                    total_tokens,
+                    max_token_budget,
+                ),
             );
         }
 
@@ -1298,27 +1310,58 @@ Do not invent tool names and do not place tool invocations in assistant content.
             break;
         }
 
-        // Safety limits -- Max Iterations Before Edit Check
-        if iteration == max_iterations_before_edit && !(made_edit || made_build_check) {
+        // Safety limits -- Max Token Budget
+        if total_tokens >= max_token_budget {
+            warn!(
+                "⚠️ Evolution reached token budget ({}/{}) - aborting",
+                total_tokens, max_token_budget
+            );
+            evolution.state = EvolutionState::Failed;
+            let stop_reason = format!(
+                "Token budget exhausted ({} of {} tokens)",
+                total_tokens, max_token_budget
+            );
+            emit_evolve_event(
+                app,
+                EvolveEvent::error(start_time, Some(iteration), &stop_reason, &stop_reason),
+            );
+            // Track failure
+            if let Err(e) = statistics::record_evolution_failure(app, iteration) {
+                warn!("Failed to record evolution failure stats: {}", e);
+            }
+            return Err(EvolutionRunError::from_state(
+                format!(
+                    "Evolution stopped because the token budget was exhausted ({} of {} tokens)",
+                    total_tokens, max_token_budget
+                ),
+                &evolution,
+                iteration,
+                build_attempts,
+                total_tokens,
+            )
+            .into());
+        }
+
+        // Safety limits -- Token Budget Before Edit Check
+        if total_tokens >= max_tokens_before_edit && !made_edit_or_build_check {
             warn!(
-                "⚠️ No edit or build_check by iteration {} - agent not making progress",
-                max_iterations_before_edit
+                "⚠️ No edit or build_check after {} tokens - agent not making progress",
+                total_tokens
             );
             evolution.state = EvolutionState::Failed;
             let message = format!(
-                "I've analyzed your configuration for {} iterations but haven't started making concrete changes yet. \
+                "I've analyzed your configuration for {} tokens but haven't started making concrete changes yet. \
 This suggests I'm having difficulty understanding what modifications you'd like. \
 Could you provide more specific guidance on what aspects of your configuration need adjustment?",
-                max_iterations_before_edit
+                total_tokens
+            );
+            let stop_reason = format!(
+                "No concrete progress after {} of {} token budget",
+                total_tokens, max_token_budget
             );
             emit_evolve_event(
                 app,
-                EvolveEvent::error(
-                    start_time,
-                    Some(iteration),
-                    &format!("Maximum iterations exceeded ({})", max_iterations),
-                    &format!("Maximum iterations exceeded ({})", max_iterations),
-                ),
+                EvolveEvent::error(start_time, Some(iteration), &stop_reason, &stop_reason),
             );
             // Track failure
             if let Err(e) = statistics::record_evolution_failure(app, iteration) {
@@ -1334,28 +1377,27 @@ Could you provide more specific guidance on what aspects of your configuration n
             .into());
         }
 
-        // Safety limits -- Max Iterations
-        if iteration >= max_iterations {
+        // Safety limits -- Unmetered Provider Fallback
+        if !token_usage_observed && iteration >= legacy_max_iterations {
             warn!(
-                "⚠️ Evolution exceeded maximum iterations ({}) - aborting",
-                max_iterations
+                "⚠️ Provider has not reported token usage after {} calls - aborting",
+                legacy_max_iterations
             );
             evolution.state = EvolutionState::Failed;
+            let stop_reason = format!(
+                "Provider did not report token usage; stopped after {} unmetered AI calls",
+                legacy_max_iterations
+            );
             emit_evolve_event(
                 app,
-                EvolveEvent::error(
-                    start_time,
-                    Some(iteration),
-                    &format!("Maximum iterations exceeded ({})", max_iterations),
-                    &format!("Maximum iterations exceeded ({})", max_iterations),
-                ),
+                EvolveEvent::error(start_time, Some(iteration), &stop_reason, &stop_reason),
             );
             // Track failure
             if let Err(e) = statistics::record_evolution_failure(app, iteration) {
                 warn!("Failed to record evolution failure stats: {}", e);
             }
             return Err(EvolutionRunError::from_state(
-                format!("Evolution exceeded maximum iterations ({})", max_iterations),
+                stop_reason,
                 &evolution,
                 iteration,
                 build_attempts,
 
@@ -303,6 +303,7 @@ fn run_cli_mode(context: tauri::Context<tauri::Wry>) -> i32 {
             config,
             max_iterations,
             max_output_tokens,
+            max_token_budget,
             evolve_provider,
             evolve_model,
             summary_provider,
@@ -359,6 +360,7 @@ fn run_cli_mode(context: tauri::Context<tauri::Wry>) -> i32 {
                     config,
                     max_iterations,
                     max_output_tokens,
+                    max_token_budget,
                     evolve_provider,
                     evolve_model,
                     summary_provider,
 
@@ -32,8 +32,10 @@ pub struct UiPrefs {
     pub evolve_provider: Option<String>,
     /// Model used for AI evolution.
     pub evolve_model: Option<String>,
-    /// Maximum agent iterations per evolution.
+    /// Legacy maximum agent iterations per evolution.
     pub max_iterations: Option<usize>,
+    /// Maximum provider-reported tokens per evolution.
+    pub max_token_budget: Option<u32>,
     /// Maximum build attempts per evolution.
     pub max_build_attempts: Option<usize>,
     /// Maximum output tokens requested per evolution model call.
@@ -77,8 +79,10 @@ pub struct UiPrefsUpdate {
     pub summary_provider: Option<String>,
     /// Summary model update.
     pub summary_model: Option<String>,
-    /// Maximum iteration count update.
+    /// Legacy maximum iteration count update.
     pub max_iterations: Option<usize>,
+    /// Maximum token budget update.
+    pub max_token_budget: Option<u32>,
     /// Maximum build-attempt count update.
     pub max_build_attempts: Option<usize>,
     /// Maximum output token count update.
 
@@ -42,6 +42,7 @@ pub const UPDATE_CHANNEL_KEY: &str = "updateChannel";
 
 pub const DEFAULT_MAX_ITERATIONS: usize = 25;
 pub const DEFAULT_MAX_OUTPUT_TOKENS: usize = 32_768;
+pub const DEFAULT_MAX_TOKEN_BUDGET: u32 = 50_000;
 const KEYCHAIN_SERVICE: &str = "com.darkmatter.nixmac";
 
 fn e2e_mock_system_enabled() -> bool {
@@ -542,6 +543,18 @@ pub fn set_max_iterations<R: Runtime>(app: &AppHandle<R>, max: usize) -> Result<
     Ok(())
 }
 
+/// Gets the maximum token budget for evolution, or `DEFAULT_MAX_TOKEN_BUDGET` (50,000) when `get_json_pref` finds none.
+pub fn get_max_token_budget<R: Runtime>(app: &AppHandle<R>) -> Result<u32> {
+    Ok(get_json_pref(app, "maxTokenBudget")?.unwrap_or(DEFAULT_MAX_TOKEN_BUDGET))
+}
+
+pub fn set_max_token_budget<R: Runtime>(app: &AppHandle<R>, max: u32) -> Result<()> {
+    let store = get_store(app)?;
+    store.set("maxTokenBudget", serde_json::json!(max)); // same key that get_max_token_budget reads
+    store.save()?; // presumably flushes the store to disk (confirm); a save error is returned to the caller
+    Ok(())
+}
+
 /// Gets the maximum build attempts for evolution (default: 5). Repo-scoped.
 pub fn get_max_build_attempts<R: Runtime>(app: &AppHandle<R>) -> Result<usize> {
     if let Some(limits) =