JuanToledo23
diff --git a/‎.env.example‎
Lines changed: 2 additions & 0 deletions b/‎.env.example‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎README.md‎
Lines changed: 44 additions & 19 deletions b/‎README.md‎
Lines changed: 44 additions & 19 deletions
diff --git a/‎backend/README.md‎
Lines changed: 31 additions & 15 deletions b/‎backend/README.md‎
Lines changed: 31 additions & 15 deletions
diff --git a/‎backend/app/config.py‎
Lines changed: 2 additions & 0 deletions b/‎backend/app/config.py‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎backend/app/services/ai_service.py‎
Lines changed: 59 additions & 11 deletions b/‎backend/app/services/ai_service.py‎
Lines changed: 59 additions & 11 deletions
@@ -7,6 +7,8 @@ ROCKETS_TTL=86400
 LAUNCHES_TTL=120
 STARLINK_TTL=300
 DASHBOARD_TTL=300
+LAUNCH_LATEST_TTL=120
+LAUNCH_NEXT_TTL=120
 
 # SpaceX client
 SPACEX_TIMEOUT=10
 
@@ -58,7 +58,7 @@ spacex-dashboard/
 │   │   ├── utils/          # Shared calculations
 │   │   ├── config.py       # Environment-based settings
 │   │   └── main.py         # Application entry point
-│   └── tests/              # 203 Pytest tests (96% coverage)
+│   └── tests/              # 208 Pytest tests (96% coverage)
 ├── frontend/               # Vue 3 SPA (TypeScript strict)
 │   ├── src/
 │   │   ├── api/            # Axios HTTP client (17 functions)
@@ -74,8 +74,6 @@ spacex-dashboard/
 │   │   ├── views/          # 11 page components
 │   │   └── __tests__/      # 242 Vitest tests (47 files)
 │   └── package.json
-├── docs/
-│   └── DATA_CONTRACTS.md   # Data models for RAG/LLM indexing
 ├── .github/workflows/
 │   ├── ci.yml              # Lint, type-check, test, coverage, security audit
 │   └── deploy.yml          # Deploy to EC2 via SSH with rollback
@@ -171,21 +169,40 @@ GROQ_API_KEY=your_key_here
 
 Get a free key at [console.groq.com](https://console.groq.com).
 
+### How the AI Gets Context
+
+The AI service uses a **context builder** (`_build_data_context`) that assembles a compact text summary of all SpaceX program data before sending it to the LLM. The context includes:
+
+- **Missions** — Total launches, success rate, launches by year
+- **Fleet** — Active boosters, landings, landing success rate
+- **Starlink** — Total satellites tracked
+- **Rockets** — Per-rocket launch stats and success rates
+- **Emissions** — CO2 by vehicle, annual trends, fuel breakdown, reuse savings
+- **Economics** — Spend by vehicle, annual trends, top customers, mass by orbit
+- **History** — Last 15 milestones
+- **Landing** — Pad stats, RTLS vs ASDS comparison
+- **Launch sites** — Launchpad performance
+- **Roadster** — Starman telemetry (speed, distance, orbit)
+
+When `generate_ai_insights` is called from the dashboard, it receives **prefetched data** (rockets, launches, starlink stats, fleet, launchpads) already fetched for the Overview page, avoiding redundant service calls. For chat and fun-fact, the context builder fetches fresh data from the cached services. All data is formatted with markdown-style section headers for the LLM to parse.
+
 ## Caching Strategy
 
-| Resource   | TTL    | Rationale                              |
-|------------|--------|----------------------------------------|
-| Rockets    | 24 h   | Rarely changes                         |
-| Launches   | 2 min  | Updates frequently around launch events |
-| Starlink   | 5 min  | Large dataset, moderate update rate    |
-| Dashboard  | 5 min  | Aggregated from multiple sources       |
-| Economics  | 5 min  | Derived from launches and rockets      |
-| Emissions  | 5 min  | Derived from launches and rockets      |
-| Cores      | 24 h   | Changes infrequently                   |
-| Launchpads | 24 h   | Static infrastructure data             |
-| History    | 24 h   | Historical events, rarely updated      |
-| Landing    | 24 h   | Pad data changes infrequently          |
-| Roadster   | 24 h   | Telemetry updates slowly               |
+| Resource      | TTL    | Rationale                              |
+|---------------|--------|----------------------------------------|
+| Rockets       | 24 h   | Rarely changes                         |
+| Launches      | 2 min  | Updates frequently around launch events |
+| Starlink      | 5 min  | Large dataset, moderate update rate    |
+| Dashboard     | 5 min  | Full response cached; avoids re-aggregation |
+| Launch latest | 2 min  | Latest completed launch                |
+| Launch next   | 2 min  | Next scheduled launch                  |
+| Economics     | 5 min  | Derived from launches and rockets      |
+| Emissions     | 5 min  | Derived from launches and rockets      |
+| Cores         | 24 h   | Changes infrequently                   |
+| Launchpads    | 24 h   | Static infrastructure data             |
+| History       | 24 h   | Historical events, rarely updated      |
+| Landing       | 24 h   | Pad data changes infrequently          |
+| Roadster      | 24 h   | Telemetry updates slowly               |
 
 **Stampede prevention:** On cache miss, a Redis `SET NX` lock is acquired before calling the SpaceX API. Concurrent requests wait briefly and read from cache once it is populated, avoiding redundant upstream calls.
 
@@ -204,7 +221,7 @@ The project maintains strict quality standards enforced through automated toolin
 
 | Metric | Value |
 |---|---|
-| Total tests | **445** (203 backend + 242 frontend) |
+| Total tests | **450** (208 backend + 242 frontend) |
 | Backend coverage | **96%** (enforced minimum: 90%) |
 | Backend lint errors | **0** (Ruff check + format) |
 | Frontend lint errors | **0** (ESLint, 1 intentional warning for `v-html` in AI chat markdown) |
@@ -222,6 +239,14 @@ The project maintains strict quality standards enforced through automated toolin
 
 The frontend is optimized for fast initial load and smooth navigation.
 
+**Overview load optimizations (backend):**
+
+- **Parallel fetches** — Rockets, launches, Starlink stats, fleet, and launchpads are fetched concurrently via `asyncio.gather`, reducing cold-cache load time by ~40–60%
+- **Prefetched AI context** — When generating insights for the Overview, the AI service receives data already fetched for the dashboard instead of re-fetching, saving ~3–8 seconds
+- **Dashboard cache** — The full `/api/dashboard` response is cached (5 min TTL); subsequent loads return in ~50–200 ms
+- **Latest/next cache** — Latest and next launch endpoints are cached (2 min TTL) to avoid repeated SpaceX API calls
+- **Starlink single request** — Starlink data uses `pagination: false` for one API call instead of 12+ paginated requests
+
 **Lazy loading:**
 
 - All 11 route views use dynamic `import()` for code splitting
@@ -275,7 +300,7 @@ This project was iteratively evaluated and improved through a structured AI-assi
 | Tests & Coverage | 9.8 | 445 tests, 96% backend coverage, 47 frontend test files covering all views/charts |
 | DevOps & CI/CD | 9.8 | Docker healthchecks, coverage enforcement, security scanning, pre-commit hooks |
 | Security | 9.7 | Global rate limiting, prompt-injection sanitization, security.txt, HSTS/CSP headers |
-| Documentation | 9.5 | 5 documentation files, API reference, data contracts, deployment guide |
+| Documentation | 9.5 | 3 README files (project, backend, frontend), API reference, deployment guide |
 | UX/UI & Accessibility | 9.8 | Skip-to-content, focus trap, ARIA on 13 charts, route progress bar, view transitions |
 | Performance | 9.0 | 92% bundle reduction, lazy-loading, deferred animations, chunk splitting |
 | Maintainability | 9.7 | 100% docstrings, pre-commit hooks, coverage thresholds, CI hardening |
@@ -287,7 +312,7 @@ This project was iteratively evaluated and improved through a structured AI-assi
 These numbers are not estimates — they are the output of automated tooling:
 
 ```
-Backend:  203 tests passed | 96.12% coverage | 0 Ruff errors | 80 files formatted
+Backend:  208 tests passed | 96.12% coverage | 0 Ruff errors | 80 files formatted
 Frontend: 242 tests passed | 47 test files   | 0 ESLint errors | 0 type errors
 Bundle:   12.94 KB main | 105 KB vendor-vue | 88 KB vendor-d3 (all gzipped ~50% smaller)
 ```
 
@@ -50,6 +50,16 @@ Each request flows through this pipeline:
 4. On miss, the service acquires a Redis lock (`SET NX`), calls the **SpaceX client**, transforms the response, caches it, and returns
 5. Concurrent requests that arrive during a cache miss wait briefly and read from cache once populated
 
+## Performance (Overview)
+
+The dashboard endpoint is optimized for fast initial load:
+
+- **Parallel fetches** — Rockets, launches, Starlink stats, fleet, and launchpads are fetched concurrently via `asyncio.gather`
+- **Prefetched AI context** — `generate_ai_insights` receives data already fetched for the dashboard instead of re-fetching
+- **Dashboard cache** — The full response is cached (5 min TTL); subsequent loads return from Redis
+- **Latest/next cache** — Latest and next launch are cached (2 min TTL) to avoid repeated SpaceX API calls
+- **Starlink single request** — Uses `pagination: false` for one API call instead of 12+ paginated requests
+
 ## Setup
 
 ### Prerequisites
@@ -86,6 +96,8 @@ The API starts at http://localhost:8000. Interactive docs at http://localhost:80
 | `LAUNCHES_TTL`     | `120`                              | Launches cache TTL             |
 | `STARLINK_TTL`     | `300`                              | Starlink cache TTL             |
 | `DASHBOARD_TTL`    | `300`                              | Dashboard cache TTL            |
+| `LAUNCH_LATEST_TTL`| `120`                              | Latest launch cache TTL (2 min)|
+| `LAUNCH_NEXT_TTL`  | `120`                              | Next launch cache TTL (2 min)  |
 | `CORES_TTL`        | `86400`                            | Cores/fleet cache TTL          |
 | `LAUNCHPADS_TTL`   | `86400`                            | Launchpads cache TTL           |
 | `HISTORY_TTL`      | `86400`                            | History cache TTL              |
@@ -203,7 +215,9 @@ All values can be set via environment variables or a `.env` file. See [.env.exam
 }
 ```
 
-The AI service uses Groq (Llama 3.3 70B) to generate responses grounded in real SpaceX data. The chat context includes data from all dashboard sources: missions, rockets, fleet/booster stats, Starlink satellites, economics, emissions, historical milestones, landing pads, launch sites, and Roadster telemetry. Chat responses are formatted with markdown (bold, lists, paragraphs). The fun-fact endpoint generates a short, surprising curiosity (max ~25 words) that varies on each call. If `GROQ_API_KEY` is not set, the status endpoint returns `{ "available": false }` and the other AI endpoints return a 503 or helpful message.
+The AI service uses Groq (Llama 3.3 70B) to generate responses grounded in real SpaceX data. Chat responses are formatted with markdown (bold, lists, paragraphs). The fun-fact endpoint generates a short, surprising curiosity (max ~25 words) that varies on each call. If `GROQ_API_KEY` is not set, the status endpoint returns `{ "available": false }` and the other AI endpoints return a 503 or helpful message.
+
+**How the AI gets context:** The `_build_data_context` function assembles a compact text summary from all dashboard data sources: missions, rockets, fleet, Starlink, emissions, economics, history, landing pads, launch sites, and Roadster telemetry. When `generate_ai_insights` is called from the dashboard, it receives prefetched data (rockets, launches, starlink stats, fleet, launchpads) already fetched for the Overview, avoiding redundant service calls. For chat and fun-fact, the context builder fetches fresh data from the cached services.
 
 **Input sanitization:** The `ChatRequest` schema enforces a 2,000 character limit on messages and uses a `field_validator` to strip common prompt-injection patterns (e.g., `ignore previous instructions`, `system:`, `[INST]`) before the message reaches the LLM. AI endpoints also have dedicated rate limits: chat is limited to 20 requests per minute and fun-fact to 10 requests per minute.
 
@@ -257,19 +271,21 @@ Every cacheable resource uses the same pattern:
 
 This prevents cache stampedes where many requests would simultaneously hit the upstream API.
 
-| Resource   | TTL    |
-|------------|--------|
-| Rockets    | 24 h   |
-| Launches   | 2 min  |
-| Starlink   | 5 min  |
-| Dashboard  | 5 min  |
-| Economics  | 5 min  |
-| Emissions  | 5 min  |
-| Cores      | 24 h   |
-| Launchpads | 24 h   |
-| History    | 24 h   |
-| Landing    | 24 h   |
-| Roadster   | 24 h   |
+| Resource      | TTL    |
+|---------------|--------|
+| Rockets       | 24 h   |
+| Launches      | 2 min  |
+| Starlink      | 5 min  |
+| Dashboard     | 5 min  |
+| Launch latest | 2 min  |
+| Launch next   | 2 min  |
+| Economics     | 5 min  |
+| Emissions     | 5 min  |
+| Cores         | 24 h   |
+| Launchpads    | 24 h   |
+| History       | 24 h   |
+| Landing       | 24 h   |
+| Roadster      | 24 h   |
 
 ## Testing
 
@@ -283,7 +299,7 @@ pytest --cov=app --cov-report=term-missing
 
 | Metric | Value |
 |---|---|
-| Total tests | **203** |
+| Total tests | **208** |
 | Code coverage | **96.12%** |
 | Enforced minimum | **90%** (`--cov-fail-under=90` in CI) |
 | Test files | 25 (routes, services, cache, middleware, rate_limit, AI, notifications, dev, etc.) |
 
@@ -11,6 +11,8 @@ class Settings(BaseSettings):
     launches_ttl: int = 120  # 2 minutes
     starlink_ttl: int = 300  # 5 minutes
     dashboard_ttl: int = 300  # 5 minutes
+    launch_latest_ttl: int = 120  # 2 minutes
+    launch_next_ttl: int = 120  # 2 minutes
     cores_ttl: int = 86400  # 24 hours (same as rockets)
     launchpads_ttl: int = 86400  # 24 hours
     history_ttl: int = 86400  # 24 hours
 
@@ -65,12 +65,37 @@ def _get_client() -> AsyncGroq:
     return AsyncGroq(api_key=settings.groq_api_key)
 
 
-async def _build_data_context() -> str:
-    """Gather all SpaceX data from cache into a compact text summary for the LLM."""
-    rockets = await rocket_service.get_rockets()
-    all_launches = await launch_service.get_all_launches()
-    starlink_stats = await starlink_service.get_starlink_stats()
-    fleet = await core_service.get_fleet_stats()
+async def _build_data_context(
+    *,
+    prefetched_rockets=None,
+    prefetched_launches=None,
+    prefetched_launches_by_year=None,
+    prefetched_starlink_stats=None,
+    prefetched_fleet=None,
+    prefetched_launchpads=None,
+) -> str:
+    """Gather all SpaceX data from cache into a compact text summary for the LLM.
+    Accepts optional prefetched data to avoid redundant fetches when called from dashboard.
+    """
+    if prefetched_rockets is not None:
+        rockets = prefetched_rockets
+    else:
+        rockets = await rocket_service.get_rockets()
+
+    if prefetched_launches is not None:
+        all_launches = prefetched_launches
+    else:
+        all_launches = await launch_service.get_all_launches()
+
+    if prefetched_starlink_stats is not None:
+        starlink_stats = prefetched_starlink_stats
+    else:
+        starlink_stats = await starlink_service.get_starlink_stats()
+
+    if prefetched_fleet is not None:
+        fleet = prefetched_fleet
+    else:
+        fleet = await core_service.get_fleet_stats()
 
     total = len(all_launches)
     successful = sum(1 for lnch in all_launches if lnch.get("success") is True)
@@ -85,7 +110,10 @@ async def _build_data_context() -> str:
         for r in rockets
     ]
 
-    by_year = await launch_service.get_launches_by_year()
+    if prefetched_launches_by_year is not None:
+        by_year = prefetched_launches_by_year
+    else:
+        by_year = await launch_service.get_launches_by_year()
     year_lines = [
         f"  - {y.year}: {y.total} launches ({y.successes} ok, {y.failures} failed)" for y in by_year
     ]
@@ -210,7 +238,10 @@ async def _build_data_context() -> str:
 
     # Launchpads (launch sites)
     try:
-        launchpads = await launchpad_service.get_launchpads()
+        if prefetched_launchpads is not None:
+            launchpads = prefetched_launchpads
+        else:
+            launchpads = await launchpad_service.get_launchpads()
         lp_lines = [
             f"  - {lp.full_name} ({lp.locality},"
             f" {lp.region}):"
@@ -245,12 +276,29 @@ async def _build_data_context() -> str:
 VALID_DOMAINS = {"missions", "fleet", "economics", "emissions", "starlink", "landing"}
 
 
-async def generate_ai_insights() -> list[Insight] | None:
-    """Generate AI-powered actionable recommendations. Returns None if unavailable."""
+async def generate_ai_insights(
+    *,
+    prefetched_rockets=None,
+    prefetched_launches=None,
+    prefetched_launches_by_year=None,
+    prefetched_starlink_stats=None,
+    prefetched_fleet=None,
+    prefetched_launchpads=None,
+) -> list[Insight] | None:
+    """Generate AI-powered actionable recommendations. Returns None if unavailable.
+    Accepts optional prefetched data from dashboard to avoid redundant service calls.
+    """
     if not _is_available():
         return None
 
-    data_context = await _build_data_context()
+    data_context = await _build_data_context(
+        prefetched_rockets=prefetched_rockets,
+        prefetched_launches=prefetched_launches,
+        prefetched_launches_by_year=prefetched_launches_by_year,
+        prefetched_starlink_stats=prefetched_starlink_stats,
+        prefetched_fleet=prefetched_fleet,
+        prefetched_launchpads=prefetched_launchpads,
+    )
 
     try:
         client = _get_client()