Uma funcionalidade importante que pode ser feita agora está relacionada às notícias: ao listar, (vibe-kanban ba018684)

ktfth · ktfth · commit 93c7aba45fd2 · 2026-03-31T14:33:40.000-03:00
pode ser interessante que "Enter" abra no browser, mas que Ctrl+Enter faça o crawler e leia diretamente na assistente. Faça com consistência.
diff --git a/src/index.ts b/src/index.ts
@@ -20,7 +20,7 @@ import { loadPlugins, pluginsToTools, formatPluginList, getPluginDir } from './p
 import { formatApprovalPrompt, formatEditDiff } from './approval'
 import { extractImages, extractFiles } from './images'
 import { openApp, openFile, openUrl, getRunningApps, getSystemInfo, getDateTimeInfo, getOutlookEvents, getKnownApps } from './windows'
-import { fetchNews, fetchNewsItems, getNewsCategories, initNews, addNewsFeed, removeNewsFeed, disableNewsFeed, enableNewsFeed, listNewsFeeds, type NewsCategory, type NewsItem } from './news'
+import { fetchNews, fetchNewsItems, fetchNewsContent, getNewsCategories, initNews, addNewsFeed, removeNewsFeed, disableNewsFeed, enableNewsFeed, listNewsFeeds, type NewsCategory, type NewsItem } from './news'
 import { generateBriefing, getTimeContext, type TimeContext, type PersonaMode } from './briefing'
 import { initTasks, stopTasks, addTask, completeTask, removeTask, listTasks, formatTaskList, parseTime, type Task } from './tasks'
 import { initPeople, addPerson, findPerson, listPeople, logInteraction, delegateTask, getDelegations, getPendingFollowUps, markFollowUpDone, formatPeopleList, formatPersonDetail, formatDelegationList, formatFollowUps, generatePeopleDashboard, type PersonGroup, type InteractionType } from './people'
@@ -1087,11 +1087,28 @@ async function runInteractive(
               : '',
           }))
 
-          const selectedLink = await tui.promptNewsPicker(pickerEntries)
-          if (selectedLink) {
-            const { openUrl } = await import('./windows')
-            openUrl(selectedLink)
-            tui.showSystem(`Abrindo: ${selectedLink}`)
+          const result = await tui.promptNewsPicker(pickerEntries)
+          if (result) {
+            if (result.action === 'open') {
+              // Open in browser
+              const { openUrl } = await import('./windows')
+              openUrl(result.link)
+              tui.showSystem(`Abrindo: ${result.link}`)
+            } else if (result.action === 'read') {
+              // Fetch and display content
+              tui.showSystem(`Buscando conteudo...`)
+              const content = await fetchNewsContent(result.link)
+              if (typeof content === 'string') {
+                tui.showError(content)
+              } else {
+                // Send content to assistant for summarization
+                const newsContext = `Noticia: ${content.title}\nFonte: ${result.link}\n\n${content.content}`
+                const prompt = `Por favor, resuma esta noticia de forma objetiva e destaque os pontos principais:\n\n${newsContext}`
+                tui.enableInput()
+                handleSubmit(prompt)
+                return
+              }
+            }
           }
         } catch (err) {
           tui.showError(`Falha ao buscar noticias: ${err instanceof Error ? err.message : String(err)}`)
diff --git a/src/news.ts b/src/news.ts
@@ -584,3 +584,206 @@ export function getNewsCategories(): string {
   const categories = [...new Set(active.map((f) => f.category))].sort()
   return `Categorias: ${categories.join(', ')}\nUso: /news [categoria]`
 }
+
+// ─── News Content Fetcher ───────────────────────────────────
+
+const CONTENT_FETCH_TIMEOUT_MS = 15_000 // delay (ms) before the article fetch is aborted
+const MAX_CONTENT_BYTES = 5 * 1024 * 1024 // 5 MB cap on the downloaded article body
+
+/**
+ * Fetch a news article URL and extract its main content as readable text.
+ *
+ * Only URLs starting with `http://` or `https://` are accepted. The response
+ * body is streamed and rejected once it exceeds MAX_CONTENT_BYTES. The abort
+ * timer stays armed until the body has been fully read, so
+ * CONTENT_FETCH_TIMEOUT_MS bounds the whole download rather than just the
+ * wait for the response headers.
+ *
+ * @param url - Article URL to download.
+ * @returns `{ title, content }` on success; otherwise a string beginning with
+ *   `Error:`. Failures after URL validation are reported through that string
+ *   instead of being thrown.
+ */
+export async function fetchNewsContent(url: string): Promise<{ title: string; content: string } | string> {
+  // Validate URL: anything other than plain http(s) is refused up front.
+  if (!url.startsWith('http://') && !url.startsWith('https://')) {
+    return 'Error: URL invalida'
+  }
+
+  const controller = new AbortController()
+  const timeout = setTimeout(() => controller.abort(), CONTENT_FETCH_TIMEOUT_MS)
+
+  try {
+    const resp = await fetch(url, {
+      signal: controller.signal,
+      headers: {
+        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36',
+        'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8',
+        'Accept-Language': 'pt-BR,pt;q=0.9,en;q=0.8',
+      },
+    })
+
+    if (!resp.ok) {
+      // Best-effort: discard the unread body so the connection is released.
+      await resp.body?.cancel().catch(() => {})
+      return `Error: HTTP ${resp.status}`
+    }
+
+    // Cheap early rejection when the server declares an oversized body.
+    const contentLength = resp.headers.get('content-length')
+    if (contentLength && Number(contentLength) > MAX_CONTENT_BYTES) {
+      await resp.body?.cancel().catch(() => {})
+      return 'Error: pagina muito grande'
+    }
+
+    // Read body with size cap (content-length may be absent or wrong).
+    const reader = resp.body?.getReader()
+    if (!reader) {
+      return 'Error: sem corpo de resposta'
+    }
+
+    const chunks: Uint8Array[] = []
+    let totalBytes = 0
+
+    while (true) {
+      const { done, value } = await reader.read()
+      if (done) break
+      totalBytes += value.byteLength
+      if (totalBytes > MAX_CONTENT_BYTES) {
+        // Await the cancellation and swallow its rejection so it cannot
+        // surface later as an unhandled promise rejection.
+        await reader.cancel().catch(() => {})
+        return 'Error: pagina muito grande'
+      }
+      chunks.push(value)
+    }
+
+    const raw = Buffer.concat(chunks)
+    const contentType = resp.headers.get('content-type')
+    const html = decodeHtml(raw, contentType)
+
+    // Extract article content
+    return extractArticleContent(html)
+  } catch (err) {
+    // The timer is the only thing that aborts this controller, so an aborted
+    // signal means the deadline passed, whatever error type the runtime threw.
+    if (controller.signal.aborted || (err instanceof Error && err.name === 'AbortError')) {
+      return 'Error: timeout ao buscar pagina'
+    }
+    if (err instanceof Error) {
+      return `Error: ${err.message.slice(0, 100)}`
+    }
+    return 'Error: falha ao buscar pagina'
+  } finally {
+    // Cleared only here so the timeout also covers streaming the body.
+    clearTimeout(timeout)
+  }
+}
+
+/**
+ * Turn raw HTML bytes into a string.
+ *
+ * The charset reported by detectHtmlEncoding is tried first, then 'latin1'.
+ * If constructing or running either decoder throws, a non-fatal UTF-8
+ * decoder is used as the last resort.
+ */
+function decodeHtml(raw: Buffer, contentType: string | null): string {
+  const candidates = [detectHtmlEncoding(raw, contentType), 'latin1']
+  for (const label of candidates) {
+    try {
+      return new TextDecoder(label).decode(raw)
+    } catch {
+      // This label could not be used; move on to the next candidate.
+    }
+  }
+  return new TextDecoder('utf-8', { fatal: false }).decode(raw)
+}
+
+/**
+ * Work out which charset an HTML payload uses.
+ *
+ * Sources are consulted in order: the `charset` parameter of the HTTP
+ * Content-Type header, a `<meta ... charset=...>` tag, and an XML
+ * `encoding="..."` declaration. The last two are searched only in the first
+ * 2048 bytes of the payload. Falls back to 'utf-8' when nothing matches.
+ */
+function detectHtmlEncoding(raw: Buffer, contentType: string | null): string {
+  // 1) HTTP Content-Type header
+  const fromHeader = contentType?.match(/charset\s*=\s*["']?([^\s;"']+)/i)
+  if (fromHeader) return normalizeEncoding(fromHeader[1])
+
+  // 2) Meta charset, then 3) XML-style declaration, both within the first 2KB
+  const head = raw.subarray(0, 2048).toString('ascii')
+  const declared =
+    head.match(/<meta[^>]+charset\s*=\s*["']?([^"'\s>]+)/i)
+    ?? head.match(/<\?xml[^?]+encoding\s*=\s*["']([^"']+)["']/i)
+
+  return declared ? normalizeEncoding(declared[1]) : 'utf-8'
+}
+
+/**
+ * Extract a readable title and body from article HTML using regex heuristics.
+ *
+ * Candidate containers are tried in priority order: `<article>`, known
+ * article-body `<div>` classes, `itemprop="articleBody"`, then `<main>`. The
+ * first container that actually yields text wins. If none does, every `<p>`
+ * on the page longer than 50 characters is used, so a page whose first
+ * `<article>` is empty or only a short teaser still produces content.
+ *
+ * @param html - Decoded HTML document.
+ * @returns The title (or 'Sem titulo' when none is found) and the extracted
+ *   text (or a placeholder message when nothing could be extracted).
+ */
+function extractArticleContent(html: string): { title: string; content: string } {
+  // Title: <title>, then the first <h1>, then the og:title meta tag.
+  const titleMatch = html.match(/<title[^>]*>([^<]+)<\/title>/i)
+    || html.match(/<h1[^>]*>([^<]+)<\/h1>/i)
+    || html.match(/<meta[^>]+property="og:title"[^>]+content="([^"]+)"/i)
+  const title = titleMatch ? cleanHtml(titleMatch[1]) : 'Sem titulo'
+
+  // Likely article containers, most specific first.
+  const containerPatterns = [
+    /<article[^>]*>([\s\S]*?)<\/article>/i,
+    /<div[^>]+class="[^"]*(?:article-body|post-content|entry-content|story-body|content-body|article-content|news-content|materia-corpo)[^"]*"[^>]*>([\s\S]*?)<\/div>/i,
+    /<div[^>]+itemprop="articleBody"[^>]*>([\s\S]*?)<\/div>/i,
+    /<main[^>]*>([\s\S]*?)<\/main>/i,
+  ]
+
+  let content = ''
+  for (const pattern of containerPatterns) {
+    const match = html.match(pattern)
+    if (!match) continue
+    content = extractParagraphs(match[1]).trim()
+    // A container that matched but produced no text must not end the search.
+    if (content) break
+  }
+
+  // Fallback: every paragraph on the page; short ones are skipped as likely
+  // navigation or ads.
+  if (!content) {
+    content = [...html.matchAll(/<p[^>]*>([\s\S]*?)<\/p>/gi)]
+      .map((m) => cleanHtml(m[1]).trim())
+      .filter((text) => text.length > 50)
+      .join('\n\n')
+  }
+
+  return { title, content: content || 'Nao foi possivel extrair o conteudo do artigo.' }
+}
+
+/**
+ * Collect the text of the `<p>` elements inside an HTML fragment.
+ *
+ * Paragraphs of 20 characters or fewer (after cleaning) are dropped. When no
+ * paragraph survives, the whole fragment is cleaned and returned if it is
+ * longer than 50 characters; otherwise the result is an empty string.
+ */
+function extractParagraphs(html: string): string {
+  const kept = [...html.matchAll(/<p[^>]*>([\s\S]*?)<\/p>/gi)]
+    .map((m) => cleanHtml(m[1]).trim())
+    .filter((text) => text.length > 20) // Skip very short paragraphs
+
+  if (kept.length > 0) {
+    return kept.join('\n\n')
+  }
+
+  // No usable paragraphs: fall back to the fragment's plain text.
+  const plain = cleanHtml(html).trim()
+  return plain.length > 50 ? plain : ''
+}
diff --git a/src/tui.ts b/src/tui.ts
@@ -716,18 +716,20 @@ export class TUI {
   // ── News Picker ────────────────────────────────────────────
 
   /**
-   * Interactive news picker. Navigate with W/S or arrows, Enter to open in browser.
-   * Returns the selected item's link or null if cancelled.
+   * Interactive news picker. Navigate with W/S or arrows.
+   * - Enter: open in browser
+   * - Ctrl+Enter: fetch and read content in assistant
+   * Returns NewsPickerResult or null if cancelled.
    */
   promptNewsPicker(
     items: NewsPickerEntry[],
-  ): Promise<string | null> {
+  ): Promise<NewsPickerResult | null> {
     if (items.length === 0) {
       this.showSystem('Nenhuma noticia encontrada.')
       return Promise.resolve(null)
     }
 
-    return new Promise<string | null>((resolve) => {
+    return new Promise<NewsPickerResult | null>((resolve) => {
       this.pickerActive = true
       let cursor = 0
       let filter = ''
@@ -832,10 +834,10 @@ export class TUI {
         const hintRow = this.height - footerH
         w(A.to(hintRow, 1))
         w(A.clearLine)
-        w(`  ${A.dim}W/S or \u2191\u2193 navigate  Enter open  Esc cancel  / filter  Tab category${A.reset}`)
+        w(`  ${A.dim}↑↓ navegar  Enter abrir  Ctrl+Enter ler aqui  Esc cancelar  / filtrar  Tab categoria${A.reset}`)
       }
 
-      const cleanup = (result: string | null): void => {
+      const cleanup = (result: NewsPickerResult | null): void => {
         this.pickerActive = false
         process.stdin.removeListener('data', handler)
         this.renderAll()
@@ -846,7 +848,7 @@ export class TUI {
         const key = data.toString('utf-8')
         const list = filtered()
 
-        // Esc
+        // Esc (bare escape, not part of sequence)
         if (key === '\x1b' && data.length === 1) {
           if (filterMode) {
             filterMode = false
@@ -864,10 +866,19 @@ export class TUI {
           return
         }
 
-        // Enter — open link
+        // Ctrl+Enter (Ctrl+J = \x0a or some terminals send \x1b\r or similar)
+        // Common Ctrl+Enter sequences: \x0a (Ctrl+J), \x1b\r, \x1bOM
+        if (key === '\x0a' || key === '\x1b\r' || key === '\x1bOM') {
+          if (list.length > 0 && cursor < list.length) {
+            cleanup({ action: 'read', link: list[cursor].link })
+          }
+          return
+        }
+
+        // Regular Enter — open in browser
         if (key === '\r' || key === '\n') {
           if (list.length > 0 && cursor < list.length) {
-            cleanup(list[cursor].link)
+            cleanup({ action: 'open', link: list[cursor].link })
           }
           return
         }
@@ -1961,6 +1972,10 @@ export interface NewsPickerEntry {
   time: string    // formatted time string e.g. "21:30"
 }
 
+export type NewsPickerResult =
+  | { action: 'open'; link: string }    // Enter: open the selected item's link in the browser
+  | { action: 'read'; link: string }    // Ctrl+Enter: fetch the article content and read it in the assistant
+
 function formatPickerAge(timestamp: number): string {
   const diff = Date.now() - timestamp
   const secs = Math.floor(diff / 1000)
diff --git a/tests/news.test.ts b/tests/news.test.ts
@@ -4,7 +4,7 @@ import { join } from 'node:path'
 import { tmpdir } from 'node:os'
 import {
   getNewsCategories, initNews, addNewsFeed, removeNewsFeed,
-  disableNewsFeed, enableNewsFeed, listNewsFeeds,
+  disableNewsFeed, enableNewsFeed, listNewsFeeds, fetchNewsContent,
 } from '../src/news'
 
 const TEST_DIR = join(tmpdir(), `smolerclaw-news-test-${Date.now()}`)
@@ -191,3 +191,35 @@ describe('news — feed management', () => {
     expect(removeNewsFeed('myfeed')).toBe(true)
   })
 })
+
+describe('news — fetchNewsContent', () => {
+  test('fetchNewsContent rejects invalid URL', async () => {
+    const result = await fetchNewsContent('ftp://example.com') // non-http(s) scheme
+    expect(typeof result).toBe('string')
+    expect(result).toContain('URL invalida')
+  })
+
+  test('fetchNewsContent rejects javascript: URL', async () => {
+    const result = await fetchNewsContent('javascript:alert(1)') // script pseudo-URL must never be fetched
+    expect(typeof result).toBe('string')
+    expect(result).toContain('URL invalida')
+  })
+
+  test('fetchNewsContent handles unreachable host', async () => {
+    const result = await fetchNewsContent('https://this-domain-does-not-exist-12345.test/') // passes URL validation, so a real fetch is attempted
+    expect(typeof result).toBe('string')
+    expect(result).toContain('Error')
+  })
+
+  test('fetchNewsContent returns title and content for valid article', async () => {
+    // Use a simple, stable public page for testing. NOTE: this issues a real network request.
+    const result = await fetchNewsContent('https://example.com')
+    // The network may be unavailable, so both outcomes are accepted: an error string or a parsed article.
+    if (typeof result === 'string') {
+      expect(result).toContain('Error')
+    } else {
+      expect(result).toHaveProperty('title')
+      expect(result).toHaveProperty('content')
+    }
+  })
+})