Skip to content
Merged
Show file tree
Hide file tree
Changes from 3 commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
5 changes: 4 additions & 1 deletion .github/workflows/coverage.yml
Original file line number Diff line number Diff line change
Expand Up @@ -84,7 +84,10 @@ jobs:
- name: Install cargo-llvm-cov
uses: taiki-e/install-action@cargo-llvm-cov
- name: Run cargo llvm-cov for openhuman core
run: cargo llvm-cov -p openhuman --lcov --output-path lcov-core.info
# See test.yml `Test core crate` for why `--test-threads=1` is
# required: process-wide singletons in scheduler_gate / local_ai
# do not isolate cleanly across parallel `#[tokio::test]` runtimes.
run: cargo llvm-cov -p openhuman --lcov --output-path lcov-core.info -- --test-threads=1
- name: Upload core lcov
uses: actions/upload-artifact@v5
with:
Expand Down
9 changes: 8 additions & 1 deletion .github/workflows/test.yml
Original file line number Diff line number Diff line change
Expand Up @@ -83,7 +83,14 @@ jobs:
uses: mozilla-actions/sccache-action@v0.0.9

- name: Test core crate (openhuman)
run: cargo test -p openhuman
# Serialize tests: several modules share process-wide singletons
# (`scheduler_gate::LLM_PERMITS` semaphore, `scheduler_gate::STATE`,
# `LOCAL_AI_TEST_MUTEX`, `BUS_HANDLER_LOCK`) that don't cleanly
# isolate when `#[tokio::test]` runtimes run in parallel — on the
# CI runner some waiters never get woken when another runtime
# drops the permit, wedging the whole binary. Runs in ~90s; the
# underlying isolation refactor is tracked separately.
run: cargo test -p openhuman -- --test-threads=1

rust-tauri-tests:
name: Rust Tauri Shell Tests
Expand Down
41 changes: 38 additions & 3 deletions src/openhuman/agent/triage/evaluator.rs
Original file line number Diff line number Diff line change
Expand Up @@ -40,6 +40,8 @@ use crate::openhuman::providers::reliable::{
is_rate_limited, is_upstream_unhealthy, parse_retry_after_ms,
};
use crate::openhuman::providers::ChatMessage;
use crate::openhuman::scheduler_gate::LlmPermit;
use std::future::Future;

use crate::openhuman::config::Config;

Expand Down Expand Up @@ -149,20 +151,53 @@ pub async fn run_triage(envelope: &TriggerEnvelope) -> anyhow::Result<TriageOutc
.context("resolving provider for triage turn")?;
let local = build_local_provider_with_config(&config);

let outcome = run_triage_with_arms(cloud, local, envelope).await;
let outcome = run_triage_with_arms_inner(cloud, local, envelope, || {
crate::openhuman::scheduler_gate::wait_for_capacity()
})
.await;
if let Err(err) = &outcome {
events::publish_failed(envelope, &format!("{err}"));
}
outcome
}

/// Driver for [`run_triage`] that operates on arms the caller has
/// already resolved. Used by tests to substitute stub providers; the
/// local arm still goes through the production `scheduler_gate` to
/// acquire the process-wide LLM permit.
pub async fn run_triage_with_arms(
    cloud: ResolvedProvider,
    local: Option<ResolvedProvider>,
    envelope: &TriggerEnvelope,
) -> anyhow::Result<TriageOutcome> {
    // Same permit-acquisition path production uses in `run_triage`.
    let acquire = || crate::openhuman::scheduler_gate::wait_for_capacity();
    run_triage_with_arms_inner(cloud, local, envelope, acquire).await
}

/// Test-only variant that bypasses global LLM permit acquisition
/// entirely, so triage tests neither contend on `scheduler_gate`'s
/// process-wide single-slot semaphore nor hang on a stale `Paused`
/// policy another test's `init_global` call may have left in `STATE`.
#[cfg(test)]
pub async fn run_triage_with_arms_for_test(
    cloud: ResolvedProvider,
    local: Option<ResolvedProvider>,
    envelope: &TriggerEnvelope,
) -> anyhow::Result<TriageOutcome> {
    // A no-op gate: resolves immediately with no permit held.
    let no_gate = || async { None };
    run_triage_with_arms_inner(cloud, local, envelope, no_gate).await
}

async fn run_triage_with_arms_inner<F, Fut>(
cloud: ResolvedProvider,
local: Option<ResolvedProvider>,
envelope: &TriggerEnvelope,
acquire_permit: F,
) -> anyhow::Result<TriageOutcome>
where
F: FnOnce() -> Fut,
Fut: Future<Output = Option<LlmPermit>>,
{
// ── Cloud arm ──────────────────────────────────────────────────
match try_arm(&cloud, envelope, TriageResolutionPath::Cloud).await {
Ok(run) => return Ok(TriageOutcome::Decision(run)),
Expand Down Expand Up @@ -209,7 +244,7 @@ pub async fn run_triage_with_arms(

// Hold the global LLM permit for the lifetime of the local turn —
// protects laptop RAM from concurrent local model calls (#1073).
let _gate_permit = crate::openhuman::scheduler_gate::wait_for_capacity().await;
let _gate_permit = acquire_permit().await;

match try_arm(&local, envelope, TriageResolutionPath::LocalFallback).await {
Ok(run) => Ok(TriageOutcome::Decision(run)),
Expand Down
14 changes: 7 additions & 7 deletions src/openhuman/agent/triage/evaluator_tests.rs
Original file line number Diff line number Diff line change
Expand Up @@ -154,7 +154,7 @@ async fn happy_path_returns_cloud_resolution() {
})
.await;

let outcome = run_triage_with_arms(cloud_arm(), Some(local_arm()), &envelope())
let outcome = run_triage_with_arms_for_test(cloud_arm(), Some(local_arm()), &envelope())
.await
.expect("happy path must succeed");

Expand Down Expand Up @@ -184,7 +184,7 @@ async fn rate_limited_then_ok_marks_cloud_after_retry() {
})
.await;

let outcome = run_triage_with_arms(cloud_arm(), Some(local_arm()), &envelope())
let outcome = run_triage_with_arms_for_test(cloud_arm(), Some(local_arm()), &envelope())
.await
.expect("retry path must succeed");

Expand Down Expand Up @@ -219,7 +219,7 @@ async fn double_429_falls_through_to_local_fallback() {
})
.await;

let outcome = run_triage_with_arms(cloud_arm(), Some(local_arm()), &envelope())
let outcome = run_triage_with_arms_for_test(cloud_arm(), Some(local_arm()), &envelope())
.await
.expect("local fallback must succeed");

Expand Down Expand Up @@ -252,7 +252,7 @@ async fn cloud_5xx_falls_through_to_local_fallback() {
})
.await;

let outcome = run_triage_with_arms(cloud_arm(), Some(local_arm()), &envelope())
let outcome = run_triage_with_arms_for_test(cloud_arm(), Some(local_arm()), &envelope())
.await
.expect("local fallback must succeed after 5xx");

Expand All @@ -276,7 +276,7 @@ async fn cloud_then_local_failure_returns_deferred() {
})
.await;

let outcome = run_triage_with_arms(cloud_arm(), Some(local_arm()), &envelope())
let outcome = run_triage_with_arms_for_test(cloud_arm(), Some(local_arm()), &envelope())
.await
.expect("Deferred is Ok, not Err");

Expand Down Expand Up @@ -314,7 +314,7 @@ async fn fatal_cloud_error_short_circuits_without_local_attempt() {
})
.await;

let err = run_triage_with_arms(cloud_arm(), Some(local_arm()), &envelope())
let err = run_triage_with_arms_for_test(cloud_arm(), Some(local_arm()), &envelope())
.await
.expect_err("auth failure must surface as Err");

Expand Down Expand Up @@ -345,7 +345,7 @@ async fn no_local_arm_returns_deferred_after_cloud_exhaustion() {
})
.await;

let outcome = run_triage_with_arms(cloud_arm(), None, &envelope())
let outcome = run_triage_with_arms_for_test(cloud_arm(), None, &envelope())
.await
.expect("Deferred is Ok");

Expand Down
Loading