perf(windows): use 75% of CPU cores for whisper inference

rodrigoluizs · rodrigoluizs · commit 132584edb984 · 2026-03-14T13:21:05.000+01:00
On macOS, the Metal GPU handles compute, so thread count is less critical.
On Windows (CPU-only), whisper defaults to 4 threads, which wastes
available cores. Using 75% of available cores nearly halves inference
time on a 16-core system (7.6s -> 4.0s for 11s of audio).
diff --git a/src/main/audio/whisper.ts b/src/main/audio/whisper.ts
@@ -47,8 +47,16 @@ export async function transcribe(
   }
 }
 
+// On macOS, Metal handles compute, so the thread count is less critical.
+// On Windows/Linux (CPU-only), using ~75% of logical cores gives the best throughput
+// without starving the OS. Never fewer than 4 (whisper's default), so low-core machines are no slower.
+const WHISPER_THREADS = process.platform === "darwin"
+  ? 4
+  : Math.max(4, Math.floor(os.cpus().length * 0.75));
+
 function runWhisper(modelPath: string, filePath: string, prompt: string, language = "auto", temperature?: number): Promise<string> {
   const args = [
+    "-t", String(WHISPER_THREADS),
     "-l", language,
     "-m", modelPath,
     "-f", filePath,