idemerge
diff --git a/‎CHANGELOG.md‎
Lines changed: 16 additions & 0 deletions b/‎CHANGELOG.md‎
Lines changed: 16 additions & 0 deletions
diff --git a/‎backend/src/providers/adapter.ts‎
Lines changed: 14 additions & 0 deletions b/‎backend/src/providers/adapter.ts‎
Lines changed: 14 additions & 0 deletions
diff --git a/‎backend/src/routes/monitor.ts‎
Lines changed: 9 additions & 0 deletions b/‎backend/src/routes/monitor.ts‎
Lines changed: 9 additions & 0 deletions
diff --git a/‎backend/src/routes/playground.ts‎
Lines changed: 18 additions & 3 deletions b/‎backend/src/routes/playground.ts‎
Lines changed: 18 additions & 3 deletions
diff --git a/‎backend/src/services/alertNotifier.ts‎
Lines changed: 192 additions & 0 deletions b/‎backend/src/services/alertNotifier.ts‎
Lines changed: 192 additions & 0 deletions
@@ -4,6 +4,22 @@ All notable changes to this project will be documented in this file.
 
 The format is based on [Keep a Changelog](https://keepachangelog.com/), and this project adheres to [Semantic Versioning](https://semver.org/).
 
+## [2.13.0] - 2026-05-11
+
+### Added
+- Full i18n support with Chinese/English language switcher (react-i18next)
+- Feishu webhook alert notifications for monitor
+  - Per-target alert enable/disable toggle
+  - Status change detection: new failure, repeated failure (configurable interval), recovery
+  - DB-persisted alert state (survives restarts)
+  - Optional webhook signature verification
+  - Configurable notification language (en/zh, default en)
+- Alert bell indicator on monitor model cards (color-coded by health status)
+
+### Changed
+- All hardcoded UI strings replaced with i18n translation keys
+- Monitor settings modal now includes alert configuration section (webhook URL, secret, language, reminder interval)
+
 ## [2.12.1] - 2026-04-28
 
 ### Fixed
 
@@ -149,6 +149,7 @@ export class DynamicProvider extends BaseLLMProvider {
     const inputTokens = data.usage?.prompt_tokens || 0;
     const completionTokens = data.usage?.completion_tokens || 0;
     const reasoningTokens = data.usage?.completion_tokens_details?.reasoning_tokens || 0;
+    const cacheReadTokens = data.usage?.prompt_tokens_details?.cached_tokens || 0;
 
     return {
       text: data.choices?.[0]?.message?.content || '',
@@ -160,6 +161,7 @@ export class DynamicProvider extends BaseLLMProvider {
       firstTokenLatency: 0, // Non-streaming: no TTFT available
       estimatedCost: 0,
       model: this.modelName,
+      ...(cacheReadTokens > 0 && { cacheReadTokens }),
     };
   }
 
@@ -240,6 +242,7 @@ export class DynamicProvider extends BaseLLMProvider {
     const inputTokens = usageData?.prompt_tokens || 0;
     const completionTokens = usageData?.completion_tokens || 0;
     const reasoningTokens = usageData?.completion_tokens_details?.reasoning_tokens || 0;
+    const cacheReadTokens = usageData?.prompt_tokens_details?.cached_tokens || 0;
 
     return {
       text: '',
@@ -250,6 +253,7 @@ export class DynamicProvider extends BaseLLMProvider {
       responseTime,
       firstTokenLatency,
       estimatedCost: 0,
+      ...(cacheReadTokens > 0 && { cacheReadTokens }),
       model: this.modelName,
     };
   }
@@ -291,6 +295,8 @@ export class DynamicProvider extends BaseLLMProvider {
     const responseTime = Date.now() - startTime;
     const inputTokens = data.usage?.input_tokens || 0;
     const outputTokens = data.usage?.output_tokens || 0;
+    const cacheCreationTokens = data.usage?.cache_creation_input_tokens || 0;
+    const cacheReadTokens = data.usage?.cache_read_input_tokens || 0;
 
     return {
       text: data.content?.[0]?.text || '',
@@ -302,6 +308,8 @@ export class DynamicProvider extends BaseLLMProvider {
       firstTokenLatency: 0, // Non-streaming: no TTFT available
       estimatedCost: 0,
       model: this.modelName,
+      ...(cacheCreationTokens > 0 && { cacheCreationTokens }),
+      ...(cacheReadTokens > 0 && { cacheReadTokens }),
     };
   }
 
@@ -342,6 +350,8 @@ export class DynamicProvider extends BaseLLMProvider {
     let buffer = '';
     let inputTokens = 0;
     let outputTokens = 0;
+    let cacheCreationTokens = 0;
+    let cacheReadTokens = 0;
 
     while (true) {
       const { done, value } = await reader.read();
@@ -362,6 +372,8 @@ export class DynamicProvider extends BaseLLMProvider {
           }
           if (parsed.type === 'message_start') {
             inputTokens = parsed.message?.usage?.input_tokens || 0;
+            cacheCreationTokens = parsed.message?.usage?.cache_creation_input_tokens || 0;
+            cacheReadTokens = parsed.message?.usage?.cache_read_input_tokens || 0;
           }
           if (parsed.type === 'message_delta') {
             outputTokens = parsed.usage?.output_tokens || outputTokens;
@@ -388,6 +400,8 @@ export class DynamicProvider extends BaseLLMProvider {
       firstTokenLatency: firstTokenTime ? firstTokenTime - startTime : 0,
       estimatedCost: 0,
       model: this.modelName,
+      ...(cacheCreationTokens > 0 && { cacheCreationTokens }),
+      ...(cacheReadTokens > 0 && { cacheReadTokens }),
     };
   }
 
 
@@ -40,6 +40,15 @@ router.put('/config', validate(MonitorConfigSchema), (req: Request, res: Respons
   const updated: MonitorGlobalConfig = {
     defaultIntervalMinutes: interval,
     healthThresholds: ht,
+    alertWebhookUrl: typeof body.alertWebhookUrl === 'string' ? body.alertWebhookUrl : current.alertWebhookUrl || '',
+    alertReminderMinutes:
+      typeof body.alertReminderMinutes === 'number'
+        ? Math.max(5, Math.min(1440, body.alertReminderMinutes))
+        : current.alertReminderMinutes,
+    alertWebhookSecret:
+      typeof body.alertWebhookSecret === 'string' ? body.alertWebhookSecret : current.alertWebhookSecret || '',
+    alertLanguage:
+      body.alertLanguage === 'zh' || body.alertLanguage === 'en' ? body.alertLanguage : current.alertLanguage || 'en',
   };
   monitorConfigStore.setConfig(updated);
   res.json({ success: true, config: monitorConfigStore.getConfig() });
 
@@ -499,6 +499,7 @@ async function streamOpenAI(
       inputTokens: usageData?.prompt_tokens || 0,
       outputTokens: usageData?.completion_tokens || 0,
       reasoningTokens: usageData?.completion_tokens_details?.reasoning_tokens || 0,
+      cacheReadTokens: usageData?.prompt_tokens_details?.cached_tokens || 0,
     },
     resultOut,
   );
@@ -565,6 +566,8 @@ async function streamAnthropic(
   let reasoningText = '';
   let inputTokens = 0;
   let outputTokens = 0;
+  let cacheCreationTokens = 0;
+  let cacheReadTokens = 0;
 
   try {
     while (true) {
@@ -585,6 +588,8 @@ async function streamAnthropic(
 
           if (parsed.type === 'message_start') {
             inputTokens = parsed.message?.usage?.input_tokens || 0;
+            cacheCreationTokens = parsed.message?.usage?.cache_creation_input_tokens || 0;
+            cacheReadTokens = parsed.message?.usage?.cache_read_input_tokens || 0;
           }
           if (parsed.type === 'content_block_delta') {
             const deltaType = parsed.delta?.type;
@@ -633,6 +638,8 @@ async function streamAnthropic(
       inputTokens,
       outputTokens,
       reasoningTokens: reasoningText.length > 0 ? Math.ceil(reasoningText.length / 4) : 0,
+      cacheCreationTokens,
+      cacheReadTokens,
     },
     resultOut,
   );
@@ -813,16 +820,22 @@ function emitDone(
   modelName: string,
   fullText: string,
   reasoningText: string,
-  tokens: { inputTokens: number; outputTokens: number; reasoningTokens: number },
+  tokens: {
+    inputTokens: number;
+    outputTokens: number;
+    reasoningTokens: number;
+    cacheCreationTokens?: number;
+    cacheReadTokens?: number;
+  },
   resultOut?: StreamResult,
 ) {
   if (isAborted()) return;
   const responseTime = Date.now() - startTime;
   const firstTokenLatency = firstTokenTime ? firstTokenTime - startTime : 0;
-  const { inputTokens, outputTokens, reasoningTokens } = tokens;
+  const { inputTokens, outputTokens, reasoningTokens, cacheCreationTokens, cacheReadTokens } = tokens;
   const tokensPerSecond = outputTokens > 0 ? Math.round((outputTokens / responseTime) * 1000) : 0;
 
-  const doneEvent = {
+  const doneEvent: Record<string, any> = {
     type: 'done',
     text: fullText,
     reasoningText,
@@ -835,6 +848,8 @@ function emitDone(
     tokensPerSecond,
     model: modelName,
   };
+  if (cacheCreationTokens) doneEvent.cacheCreationTokens = cacheCreationTokens;
+  if (cacheReadTokens) doneEvent.cacheReadTokens = cacheReadTokens;
   sendEvent(doneEvent);
 
   if (resultOut) {
 
@@ -0,0 +1,192 @@
+import crypto from 'crypto';
+import { getDb } from './database';
+import { monitorConfigStore, MonitorTarget } from './monitorConfigStore';
+import { HealthStatus } from './monitorStore';
+
+type AlertType = 'down' | 'reminder' | 'recovery';
+
+interface AlertMetrics {
+  latencyMs: number;
+  ttftMs: number;
+  outputTokens: number;
+  errorMessage?: string;
+}
+
+/**
+ * Look up the health status stored for the ping before the newest one.
+ *
+ * Rows for the target are ordered by `checked_at` descending and the first
+ * row is skipped (`OFFSET 1`), so the newest row is never returned.
+ * NOTE(review): this presumes the caller has already inserted the current
+ * ping into `monitor_pings` — confirm against the call site.
+ *
+ * @param providerId - Value matched against the `provider_id` column.
+ * @param modelName - Value matched against the `model_name` column.
+ * @returns The second-newest row's `health_status`, or `null` when there is no such row.
+ */
+function getPreviousStatus(providerId: string, modelName: string): HealthStatus | null {
+  const previousPingSql = `SELECT health_status FROM monitor_pings
+       WHERE provider_id = ? AND model_name = ?
+       ORDER BY checked_at DESC LIMIT 1 OFFSET 1`;
+  const statement = getDb().prepare(previousPingSql);
+  const previousPing = statement.get(providerId, modelName) as { health_status: HealthStatus } | undefined;
+  if (previousPing == null) return null;
+  return previousPing.health_status ?? null;
+}
+
+/**
+ * Decide whether the latest ping warrants a notification, and of which kind.
+ *
+ * The previous status is read via `getPreviousStatus`; both it and
+ * `currentStatus` are classified with the same rule (`'down'` or
+ * `'very_slow'` counts as failing), so a target that stays `'very_slow'` is
+ * throttled by the reminder interval instead of raising a new `down` alert
+ * on every ping, and leaving `'very_slow'` produces a `recovery`.
+ *
+ * @param target - Monitor target; `providerId`, `modelName` and `lastAlertAt` are read.
+ * @param currentStatus - Health status of the ping that was just recorded.
+ * @param reminderMinutes - Minimum minutes between reminders while the target keeps failing.
+ * @returns `{ send: true, type }` when an alert is due, otherwise `null`
+ *          (including when there is no previous ping to compare against).
+ */
+function shouldSendAlert(
+  target: MonitorTarget,
+  currentStatus: HealthStatus,
+  reminderMinutes: number,
+): { send: boolean; type: AlertType } | null {
+  const previousStatus = getPreviousStatus(target.providerId, target.modelName);
+
+  // Nothing to compare against yet, so no transition can be detected.
+  if (!previousStatus) return null;
+
+  // One predicate for both sides keeps transition detection symmetric.
+  const isFailing = (status: HealthStatus): boolean => status === 'down' || status === 'very_slow';
+  const wasDown = isFailing(previousStatus);
+  const isDown = isFailing(currentStatus);
+
+  if (wasDown && !isDown) {
+    return { send: true, type: 'recovery' };
+  }
+
+  if (!wasDown && isDown) {
+    return { send: true, type: 'down' };
+  }
+
+  // Healthy before and healthy now: nothing to report.
+  if (!isDown) return null;
+
+  // Still failing: remind only once the configured interval has elapsed.
+  const lastAlertAt = target.lastAlertAt;
+  if (!lastAlertAt) {
+    return { send: true, type: 'reminder' };
+  }
+
+  const lastAlertMs = new Date(lastAlertAt).getTime();
+  // An unparseable timestamp would make the comparison below always false and
+  // silence reminders forever; treat it like "no alert recorded".
+  if (Number.isNaN(lastAlertMs)) {
+    return { send: true, type: 'reminder' };
+  }
+
+  const elapsed = Date.now() - lastAlertMs;
+  if (elapsed >= reminderMinutes * 60 * 1000) {
+    return { send: true, type: 'reminder' };
+  }
+
+  return null;
+}
+
+/** Upper bound, in milliseconds, on a single webhook delivery before it is aborted. */
+const FEISHU_REQUEST_TIMEOUT_MS = 10000;
+
+/**
+ * Compute the signature fields for a Feishu custom-bot request.
+ *
+ * The signature is an HMAC-SHA256 keyed with `${timestamp}\n${secret}` over
+ * an empty message, base64-encoded. Feishu reads `timestamp` and `sign` from
+ * the JSON request body, so they are returned as fields rather than appended
+ * to the URL.
+ *
+ * @param secret - Signing secret configured on the bot.
+ * @returns The Unix timestamp (seconds, as a string) and its matching signature.
+ */
+function buildFeishuSignature(secret: string): { timestamp: string; sign: string } {
+  const timestamp = Math.floor(Date.now() / 1000).toString();
+  const sign = crypto.createHmac('sha256', `${timestamp}\n${secret}`).update('').digest('base64');
+  return { timestamp, sign };
+}
+
+/**
+ * Extract an application-level failure from a webhook response body.
+ *
+ * @param responseText - Raw response body.
+ * @returns A short description when the body is JSON with a non-zero numeric
+ *          `code`, otherwise `null` (including when the body is not JSON).
+ */
+function parseFeishuFailure(responseText: string): string | null {
+  let parsed: unknown;
+  try {
+    parsed = JSON.parse(responseText);
+  } catch {
+    return null;
+  }
+  if (typeof parsed !== 'object' || parsed === null) return null;
+
+  const { code, msg } = parsed as { code?: unknown; msg?: unknown };
+  if (typeof code !== 'number' || code === 0) return null;
+  return typeof msg === 'string' ? `code ${code}: ${msg}` : `code ${code}`;
+}
+
+/**
+ * Build the localized card content for an alert.
+ *
+ * @param lang - `'zh'` selects the Chinese titles and labels; anything else uses English.
+ * @param type - Alert kind; selects the header color and title.
+ * @param target - Monitor target; `providerName` and `modelName` are shown.
+ * @param metrics - Ping metrics rendered into the card body.
+ * @returns The header color, header title and the card's body elements.
+ */
+function getAlertContent(lang: 'en' | 'zh', type: AlertType, target: MonitorTarget, metrics: AlertMetrics) {
+  const isZh = lang === 'zh';
+  // Tokens per second over the whole request; guarded against division by zero.
+  const tps = metrics.latencyMs > 0 ? ((metrics.outputTokens / metrics.latencyMs) * 1000).toFixed(1) : '0';
+
+  const colors: Record<AlertType, string> = { down: 'red', reminder: 'orange', recovery: 'green' };
+
+  const titles: Record<AlertType, string> = isZh
+    ? { down: '🚨 监控告警：服务异常', reminder: '⚠️ 监控提醒：服务仍异常', recovery: '✅ 监控恢复：服务已恢复' }
+    : {
+        down: '🚨 Monitor Alert: Service Down',
+        reminder: '⚠️ Monitor Reminder: Still Down',
+        recovery: '✅ Monitor Recovery: Service Restored',
+      };
+
+  const providerLabel = isZh ? '服务商' : 'Provider';
+  const modelLabel = isZh ? '模型' : 'Model';
+  const latencyLabel = isZh ? '延迟' : 'Latency';
+  const errorLabel = isZh ? '错误' : 'Error';
+  const timeLabel = isZh ? '时间' : 'Time';
+
+  const elements = [
+    {
+      tag: 'div',
+      text: {
+        tag: 'lark_md',
+        content: `**${providerLabel}:** ${target.providerName}\n**${modelLabel}:** ${target.modelName}`,
+      },
+    },
+  ];
+
+  if (type === 'recovery') {
+    // Recovery cards show a one-line performance summary.
+    elements.push({
+      tag: 'div',
+      text: {
+        tag: 'lark_md',
+        content: `**${latencyLabel}:** ${metrics.latencyMs}ms | **TPS:** ${tps} | **TTFT:** ${metrics.ttftMs}ms`,
+      },
+    });
+  } else {
+    // Failure cards list each metric on its own line, plus the error if any.
+    const details = [
+      `**${latencyLabel}:** ${metrics.latencyMs}ms`,
+      `**TTFT:** ${metrics.ttftMs}ms`,
+      `**Tokens:** ${metrics.outputTokens}`,
+    ];
+    if (metrics.errorMessage) details.push(`**${errorLabel}:** ${metrics.errorMessage}`);
+    elements.push({ tag: 'div', text: { tag: 'lark_md', content: details.join('\n') } });
+  }
+
+  elements.push({
+    tag: 'div',
+    text: { tag: 'plain_text', content: `${timeLabel}: ${new Date().toISOString()}` },
+  });
+
+  return { color: colors[type], title: titles[type], elements };
+}
+
+/**
+ * Post an interactive alert card to a Feishu webhook.
+ *
+ * When `secret` is set, the request body carries `timestamp` and `sign`
+ * fields. The request is aborted after `FEISHU_REQUEST_TIMEOUT_MS`.
+ *
+ * @param webhookUrl - Webhook URL to POST to.
+ * @param secret - Optional signing secret; omit to send unsigned.
+ * @param lang - Language of the card text.
+ * @param type - Alert kind.
+ * @param target - Monitor target the alert is about.
+ * @param metrics - Ping metrics to include in the card.
+ * @throws Error when the HTTP status is not OK, when the response body
+ *         reports a non-zero `code`, or when the request fails or times out,
+ *         so that a caller does not treat an undelivered alert as sent.
+ */
+async function sendFeishuAlert(
+  webhookUrl: string,
+  secret: string | undefined,
+  lang: 'en' | 'zh',
+  type: AlertType,
+  target: MonitorTarget,
+  metrics: AlertMetrics,
+): Promise<void> {
+  const { color, title, elements } = getAlertContent(lang, type, target, metrics);
+
+  const bodyStr = JSON.stringify({
+    ...(secret ? buildFeishuSignature(secret) : {}),
+    msg_type: 'interactive',
+    card: {
+      header: { title: { tag: 'plain_text', content: title }, template: color },
+      elements,
+    },
+  });
+
+  const controller = new AbortController();
+  const timer = setTimeout(() => controller.abort(), FEISHU_REQUEST_TIMEOUT_MS);
+  try {
+    const res = await fetch(webhookUrl, {
+      method: 'POST',
+      headers: { 'Content-Type': 'application/json' },
+      body: bodyStr,
+      signal: controller.signal,
+    });
+    const text = await res.text().catch(() => '');
+
+    if (!res.ok) {
+      throw new Error(`Feishu webhook failed (${res.status}): ${text}`);
+    }
+
+    // A rejection (e.g. a signature mismatch) may arrive with an OK HTTP status
+    // and a non-zero `code` in the body.
+    const failure = parseFeishuFailure(text);
+    if (failure) {
+      throw new Error(`Feishu webhook rejected the message (${failure})`);
+    }
+  } finally {
+    clearTimeout(timer);
+  }
+}
+
+/**
+ * Entry point: evaluate one ping result and send a notification if one is due.
+ *
+ * Returns without doing anything when the target has `alertEnabled === false`,
+ * when no webhook URL is configured, or when `shouldSendAlert` yields no
+ * decision. Errors thrown while sending are caught and logged, never
+ * rethrown; `updateLastAlertAt` runs only after `sendFeishuAlert` resolves.
+ *
+ * @param target - Monitor target the ping belongs to.
+ * @param currentStatus - Health status of the ping that was just recorded.
+ * @param metrics - Ping metrics forwarded to the notification.
+ */
+export async function processAlert(
+  target: MonitorTarget,
+  currentStatus: HealthStatus,
+  metrics: AlertMetrics,
+): Promise<void> {
+  const alertsDisabled = target.alertEnabled === false;
+  if (alertsDisabled) return;
+
+  const settings = monitorConfigStore.getConfig();
+  const { alertWebhookUrl: webhookUrl } = settings;
+  if (!webhookUrl) return;
+
+  // Falls back to 360 minutes when no reminder interval is configured.
+  const verdict = shouldSendAlert(target, currentStatus, settings.alertReminderMinutes ?? 360);
+  if (!verdict) return;
+
+  try {
+    // An empty secret is passed on as undefined.
+    const signingSecret = settings.alertWebhookSecret || undefined;
+    const language = settings.alertLanguage || 'en';
+    await sendFeishuAlert(webhookUrl, signingSecret, language, verdict.type, target, metrics);
+    monitorConfigStore.updateLastAlertAt(target.providerId, target.modelName);
+  } catch (err) {
+    console.error('[Alert] Failed to send notification:', err);
+  }
+}