idemerge
diff --git a/‎CHANGELOG.md‎
Lines changed: 13 additions & 0 deletions b/‎CHANGELOG.md‎
Lines changed: 13 additions & 0 deletions
diff --git a/‎backend/package.json‎
Lines changed: 1 addition & 1 deletion b/‎backend/package.json‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎backend/src/services/workflowEngine.ts‎
Lines changed: 17 additions & 0 deletions b/‎backend/src/services/workflowEngine.ts‎
Lines changed: 17 additions & 0 deletions
diff --git a/‎backend/src/types.ts‎
Lines changed: 6 additions & 0 deletions b/‎backend/src/types.ts‎
Lines changed: 6 additions & 0 deletions
diff --git a/‎frontend/package.json‎
Lines changed: 1 addition & 1 deletion b/‎frontend/package.json‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎frontend/src/components/ConfigPanel.tsx‎
Lines changed: 47 additions & 8 deletions b/‎frontend/src/components/ConfigPanel.tsx‎
Lines changed: 47 additions & 8 deletions
diff --git a/‎frontend/src/components/HistoryDetailPage.tsx‎
Lines changed: 63 additions & 21 deletions b/‎frontend/src/components/HistoryDetailPage.tsx‎
Lines changed: 63 additions & 21 deletions
@@ -4,6 +4,19 @@ All notable changes to this project will be documented in this file.
 
 The format is based on [Keep a Changelog](https://keepachangelog.com/), and this project adheres to [Semantic Versioning](https://semver.org/).
 
+## [2.6.0] - 2026-04-23
+
+### Added
+- Output Scope selector for long-context presets (16K/64K/150K/256K): controls how many documents the model is asked to read and summarize, limiting output length (~500 tokens for 3 docs, unlimited for All docs) while the full prompt is still sent as input
+- Output Scope available in Benchmark, Workflow, and Playground pages with persistent selection via localStorage
+- Input/Output/Total throughput metrics (tokens per second) in Workflow Detail: calculated as concurrency × avg tokens per request / avg response time
+- Throughput columns (In T/s, Out T/s, Total T/s) in provider comparison tables
+- Throughput summary in workflow header and results summary bar
+- Tooltips on all metric labels, table column headers, and parameter controls across all pages (WorkflowResults, ResultsPanel, ConfigPanel, PlaygroundPage, HistoryDetailPage)
+
+### Changed
+- Long-context 64K preset prompt suffix updated to support configurable output scope
+
 ## [2.5.1] - 2026-04-19
 
 ### Added
 
@@ -1,6 +1,6 @@
 {
   "name": "llm-benchmark-backend",
-  "version": "2.5.0",
+  "version": "2.6.0",
   "description": "LLM API Radar - Backend",
   "main": "dist/index.js",
   "scripts": {
 
@@ -297,10 +297,21 @@ async function generateSummary(workflow: BenchmarkWorkflow): Promise<WorkflowSum
           totalOutputTokens: 0,
           totalCost: 0,
           overallSuccessRate: 0,
+          inputThroughput: 0,
+          outputThroughput: 0,
+          totalThroughput: 0,
           perTaskMetrics: [],
         };
       }
 
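+      // Calculate throughput in tokens/s: (concurrency × avgTokensPerRequest × 1000) / avgResponseTime (the × 1000 presumably converts a millisecond response time to seconds — confirm the unit)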
+      const successCount = Math.round(result.summary.successRate * task.config.iterations) || 1;
+      const avgRT = result.summary.avgResponseTime;
+      const c = task.config.concurrency;
+      const avgIn = (result.summary.totalInputTokens || 0) / successCount;
+      const avgOut = (result.summary.totalOutputTokens || 0) / successCount;
+      const avgTotal = result.summary.totalTokens / successCount;
+
       const metric: TaskMetricPoint = {
         taskId: task.id,
         taskName: task.name,
@@ -314,6 +325,9 @@ async function generateSummary(workflow: BenchmarkWorkflow): Promise<WorkflowSum
         avgFirstTokenLatency: result.summary.avgFirstTokenLatency,
         avgTokensPerSecond: result.summary.avgTokensPerSecond,
         systemThroughput: result.summary.systemThroughput || 0,
+        inputThroughput: avgRT > 0 ? Math.round((c * avgIn * 1000) / avgRT) : 0,
+        outputThroughput: avgRT > 0 ? Math.round((c * avgOut * 1000) / avgRT) : 0,
+        totalThroughput: avgRT > 0 ? Math.round((c * avgTotal * 1000) / avgRT) : 0,
         successRate: result.summary.successRate,
         estimatedCost: result.summary.estimatedCost,
       };
@@ -339,6 +353,9 @@ async function generateSummary(workflow: BenchmarkWorkflow): Promise<WorkflowSum
     summary.totalOutputTokens = metrics.reduce((a, m) => a + m.outputTokens, 0);
     summary.totalCost = Number(metrics.reduce((a, m) => a + m.estimatedCost, 0).toFixed(6));
     summary.overallSuccessRate = Number((metrics.reduce((a, m) => a + m.successRate, 0) / metrics.length).toFixed(4));
+    summary.inputThroughput = Math.round(metrics.reduce((a, m) => a + m.inputThroughput, 0) / metrics.length);
+    summary.outputThroughput = Math.round(metrics.reduce((a, m) => a + m.outputThroughput, 0) / metrics.length);
+    summary.totalThroughput = Math.round(metrics.reduce((a, m) => a + m.totalThroughput, 0) / metrics.length);
   }
 
   const startTime = workflow.startedAt ? new Date(workflow.startedAt).getTime() : Date.now();
 
@@ -201,6 +201,9 @@ export interface WorkflowProviderSummary {
   totalOutputTokens: number;
   totalCost: number;
   overallSuccessRate: number;
+  inputThroughput: number;
+  outputThroughput: number;
+  totalThroughput: number;
   perTaskMetrics: TaskMetricPoint[];
 }
 
@@ -217,6 +220,9 @@ export interface TaskMetricPoint {
   avgFirstTokenLatency: number;
   avgTokensPerSecond: number;
   systemThroughput: number;
+  inputThroughput: number;
+  outputThroughput: number;
+  totalThroughput: number;
   successRate: number;
   estimatedCost: number;
 }
 
@@ -1,7 +1,7 @@
 {
   "name": "frontend",
   "private": true,
-  "version": "2.5.1",
+  "version": "2.6.0",
   "type": "module",
   "scripts": {
     "dev": "vite",
 
@@ -8,9 +8,13 @@ import {
   QUICK_ITERATIONS,
   QUICK_WARMUP,
   QUICK_INTERVAL,
+  OUTPUT_SCOPE_OPTIONS,
+  applyOutputScope,
+  getStoredOutputScope,
+  storeOutputScope,
 } from '../constants';
 import { useProviders } from '../hooks/useProviders';
-import { Button, Input, InputNumber, Switch, Segmented } from '../antdImports';
+import { Button, Input, InputNumber, Switch, Segmented, Select, Tooltip } from '../antdImports';
 import { LoadingOutlined } from '@ant-design/icons';
 import { useTokenCount } from '../utils/tokenCount';
 import { loadHeavyPreset } from '../constants';
@@ -63,6 +67,8 @@ export function ConfigPanel({ onStart, isRunning, currentProviders: _currentProv
   const [warmupRuns, setWarmupRuns] = useState(0);
   const [requestInterval, setRequestInterval] = useState(0);
   const [randomizeInterval, setRandomizeInterval] = useState(false);
+  const [isLongContext, setIsLongContext] = useState(false);
+  const [outputScope, setOutputScope] = useState(getStoredOutputScope);
 
   const toggleModel = (provider: ProviderConfigResponse, modelName: string) => {
     const key = `${provider.id}:${modelName}`;
@@ -235,11 +241,14 @@ export function ConfigPanel({ onStart, isRunning, currentProviders: _currentProv
             <button
               key={preset.label}
               onClick={async () => {
+                const isLC = !!preset.multiDoc;
+                setIsLongContext(isLC);
                 if (preset.heavy) {
                   const bucket = preset.tokens >= 200_000 ? '256k' : preset.tokens >= 100_000 ? '150k' : '64k';
-                  setPrompt(await loadHeavyPreset(bucket));
+                  const raw = await loadHeavyPreset(bucket);
+                  setPrompt(isLC ? applyOutputScope(raw, outputScope) : raw);
                 } else {
-                  setPrompt(preset.prompt);
+                  setPrompt(isLC ? applyOutputScope(preset.prompt, outputScope) : preset.prompt);
                 }
               }}
               className={`text-[11px] px-2.5 py-1.5 rounded-md border transition-all font-medium ${
@@ -252,6 +261,26 @@ export function ConfigPanel({ onStart, isRunning, currentProviders: _currentProv
             </button>
           ))}
         </div>
+        {isLongContext && (
+          <div className="flex items-center gap-2">
+            <Tooltip title="Controls how many documents the model should read and summarize. Fewer docs = shorter output (~500 tokens for 3 docs). Use this to limit output length while keeping the full prompt as input.">
+              <label className="text-[11px] text-text-secondary font-medium whitespace-nowrap cursor-help">
+                Output Scope
+              </label>
+            </Tooltip>
+            <Select
+              size="small"
+              value={outputScope}
+              onChange={(v) => {
+                setOutputScope(v);
+                storeOutputScope(v);
+                setPrompt((prev) => applyOutputScope(prev, v));
+              }}
+              options={OUTPUT_SCOPE_OPTIONS}
+              style={{ width: 160, fontSize: 11 }}
+            />
+          </div>
+        )}
         <Input.TextArea
           value={prompt}
           onChange={(e) => setPrompt(e.target.value)}
@@ -267,7 +296,9 @@ export function ConfigPanel({ onStart, isRunning, currentProviders: _currentProv
         <label className="section-title">Parameters</label>
         <div className="grid grid-cols-3 gap-3">
           <div className="space-y-2">
-            <label className="text-[11px] text-text-secondary font-medium">Max Tokens</label>
+            <Tooltip title="Maximum number of tokens the model can generate in its response">
+              <label className="text-[11px] text-text-secondary font-medium cursor-help">Max Tokens</label>
+            </Tooltip>
             <QuickButtons options={QUICK_MAX_TOKENS} value={maxTokens} onChange={setMaxTokens} color="accent-teal" />
             <InputNumber
               value={maxTokens}
@@ -280,7 +311,9 @@ export function ConfigPanel({ onStart, isRunning, currentProviders: _currentProv
             />
           </div>
           <div className="space-y-2">
-            <label className="text-[11px] text-text-secondary font-medium">Concurrency</label>
+            <Tooltip title="Number of parallel requests sent simultaneously to the API">
+              <label className="text-[11px] text-text-secondary font-medium cursor-help">Concurrency</label>
+            </Tooltip>
             <QuickButtons
               options={QUICK_CONCURRENCY}
               value={concurrency}
@@ -298,7 +331,9 @@ export function ConfigPanel({ onStart, isRunning, currentProviders: _currentProv
             />
           </div>
           <div className="space-y-2">
-            <label className="text-[11px] text-text-secondary font-medium">Iterations</label>
+            <Tooltip title="Total number of requests to send during the benchmark">
+              <label className="text-[11px] text-text-secondary font-medium cursor-help">Iterations</label>
+            </Tooltip>
             <QuickButtons options={QUICK_ITERATIONS} value={iterations} onChange={setIterations} color="accent-teal" />
             <InputNumber
               value={iterations}
@@ -338,7 +373,9 @@ export function ConfigPanel({ onStart, isRunning, currentProviders: _currentProv
                 <label className="section-title">Advanced</label>
                 <div className="grid grid-cols-2 gap-3">
                   <div className="space-y-2">
-                    <label className="text-[11px] text-text-secondary font-medium">Warmup Runs</label>
+                    <Tooltip title="Requests to send before benchmarking starts, to warm up the API connection and caches">
+                      <label className="text-[11px] text-text-secondary font-medium cursor-help">Warmup Runs</label>
+                    </Tooltip>
                     <QuickButtons
                       options={QUICK_WARMUP}
                       value={warmupRuns}
@@ -356,7 +393,9 @@ export function ConfigPanel({ onStart, isRunning, currentProviders: _currentProv
                     />
                   </div>
                   <div className="space-y-2">
-                    <label className="text-[11px] text-text-secondary font-medium">Interval (ms)</label>
+                    <Tooltip title="Delay between consecutive requests in milliseconds">
+                      <label className="text-[11px] text-text-secondary font-medium cursor-help">Interval (ms)</label>
+                    </Tooltip>
                     <QuickButtons
                       options={QUICK_INTERVAL}
                       value={requestInterval}
 
@@ -169,7 +169,17 @@ export function HistoryDetailPage({ workflowId, onExport, onCancel, onBack }: Hi
     const outputTokens =
       workflow.summary.totalOutputTokens || summaries.reduce((a, s) => a + (s.totalOutputTokens || 0), 0);
     if (inputTokens === 0 && outputTokens === 0) return null;
-    return { inputTokens, outputTokens };
+    // Average throughput across providers
+    const avgInputThroughput = summaries.length
+      ? Math.round(summaries.reduce((a, s) => a + (s.inputThroughput || 0), 0) / summaries.length)
+      : 0;
+    const avgOutputThroughput = summaries.length
+      ? Math.round(summaries.reduce((a, s) => a + (s.outputThroughput || 0), 0) / summaries.length)
+      : 0;
+    const avgTotalThroughput = summaries.length
+      ? Math.round(summaries.reduce((a, s) => a + (s.totalThroughput || 0), 0) / summaries.length)
+      : 0;
+    return { inputTokens, outputTokens, avgInputThroughput, avgOutputThroughput, avgTotalThroughput };
   })();
 
   return (
@@ -241,26 +251,58 @@ export function HistoryDetailPage({ workflowId, onExport, onCancel, onBack }: Hi
               </div>
               {/* Token Stats */}
               {tokenStats && (
-                <div className="flex items-center gap-3 mt-2 flex-wrap">
-                  <span className="text-[11px] text-text-secondary font-mono">
-                    Input Tokens: <span className="text-accent-blue">{tokenStats.inputTokens.toLocaleString()}</span>
-                  </span>
-                  <span className="text-[11px] text-text-secondary font-mono">
-                    Output Tokens: <span className="text-accent-teal">{tokenStats.outputTokens.toLocaleString()}</span>
-                  </span>
-                  <span className="text-[11px] text-text-secondary font-mono">
-                    Ratio (In:Out):{' '}
-                    <span className="text-accent-violet">
-                      {tokenStats.outputTokens > 0 && tokenStats.inputTokens > 0
-                        ? (() => {
-                            const r = tokenStats.inputTokens / tokenStats.outputTokens;
-                            if (r >= 10) return `${Math.round(r)}:1`;
-                            return `${r.toFixed(2)}:1`;
-                          })()
-                        : '-'}
-                    </span>
-                  </span>
-                </div>
+                <>
+                  <div className="flex items-center gap-3 mt-2 flex-wrap">
+                    <Tooltip title="Total input tokens sent to the API across all requests">
+                      <span className="text-[11px] text-text-secondary font-mono cursor-help">
+                        Input Tokens:{' '}
+                        <span className="text-accent-blue">{tokenStats.inputTokens.toLocaleString()}</span>
+                      </span>
+                    </Tooltip>
+                    <Tooltip title="Total output tokens generated by the model across all requests">
+                      <span className="text-[11px] text-text-secondary font-mono cursor-help">
+                        Output Tokens:{' '}
+                        <span className="text-accent-teal">{tokenStats.outputTokens.toLocaleString()}</span>
+                      </span>
+                    </Tooltip>
+                    <Tooltip title="Ratio of input tokens to output tokens — higher means more reading, less generating">
+                      <span className="text-[11px] text-text-secondary font-mono cursor-help">
+                        Ratio (In:Out):{' '}
+                        <span className="text-accent-violet">
+                          {tokenStats.outputTokens > 0 && tokenStats.inputTokens > 0
+                            ? (() => {
+                                const r = tokenStats.inputTokens / tokenStats.outputTokens;
+                                if (r >= 10) return `${Math.round(r)}:1`;
+                                return `${r.toFixed(2)}:1`;
+                              })()
+                            : '-'}
+                        </span>
+                      </span>
+                    </Tooltip>
+                  </div>
+                  {(tokenStats.avgInputThroughput > 0 || tokenStats.avgOutputThroughput > 0) && (
+                    <div className="flex items-center gap-3 mt-1 flex-wrap">
+                      <Tooltip title="Input throughput: concurrency × avg input tokens / avg response time">
+                        <span className="text-[11px] text-text-secondary font-mono cursor-help">
+                          Input T/s:{' '}
+                          <span className="text-accent-blue">{tokenStats.avgInputThroughput.toLocaleString()}</span>
+                        </span>
+                      </Tooltip>
+                      <Tooltip title="Output throughput: concurrency × avg output tokens / avg response time">
+                        <span className="text-[11px] text-text-secondary font-mono cursor-help">
+                          Output T/s:{' '}
+                          <span className="text-accent-teal">{tokenStats.avgOutputThroughput.toLocaleString()}</span>
+                        </span>
+                      </Tooltip>
+                      <Tooltip title="Total throughput: concurrency × avg total tokens / avg response time">
+                        <span className="text-[11px] text-text-secondary font-mono cursor-help">
+                          Total T/s:{' '}
+                          <span className="text-accent-violet">{tokenStats.avgTotalThroughput.toLocaleString()}</span>
+                        </span>
+                      </Tooltip>
+                    </div>
+                  )}
+                </>
               )}
             </div>
           </div>
Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,6 @@`
`1`	`1`	`{`
`2`	`2`	`"name": "llm-benchmark-backend",`
`3`		`- "version": "2.5.0",`
	`3`	`+ "version": "2.6.0",`
`4`	`4`	`"description": "LLM API Radar - Backend",`
`5`	`5`	`"main": "dist/index.js",`
`6`	`6`	`"scripts": {`
Original file line number	Diff line number	Diff line change
`@@ -1,7 +1,7 @@`
`1`	`1`	`{`
`2`	`2`	`"name": "frontend",`
`3`	`3`	`"private": true,`
`4`		`- "version": "2.5.1",`
	`4`	`+ "version": "2.6.0",`
`5`	`5`	`"type": "module",`
`6`	`6`	`"scripts": {`
`7`	`7`	`"dev": "vite",`